{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.7241379310344827, "eval_steps": 500, "global_step": 1800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0, "loss_full_dim": 27.883209228515625, "loss_main": 56.09363555908203, "loss_parscale": 56.0, "loss_sub_dim": 28.210426330566406, "loss_vclub": 2.86102294921875e-05, "parscale_sim": 0.99609375, "step": 0 }, { "epoch": 0.0009578544061302681, "grad_norm": 544.1687622070312, "learning_rate": 5.0000000000000004e-08, "loss": 56.0936, "step": 1 }, { "epoch": 0.0009578544061302681, "loss_full_dim": 28.56818962097168, "loss_main": 57.451297760009766, "loss_parscale": 57.5, "loss_sub_dim": 28.883108139038086, "loss_vclub": -5.7220458984375e-06, "parscale_sim": 0.9921875, "step": 1 }, { "epoch": 0.0019157088122605363, "grad_norm": 334.72515869140625, "learning_rate": 1.0000000000000001e-07, "loss": 57.4513, "step": 2 }, { "epoch": 0.0019157088122605363, "loss_full_dim": 27.948469161987305, "loss_main": 56.19000244140625, "loss_parscale": 56.0, "loss_sub_dim": 28.241535186767578, "loss_vclub": -1.33514404296875e-05, "parscale_sim": 0.9921875, "step": 2 }, { "epoch": 0.0028735632183908046, "grad_norm": 317.88812255859375, "learning_rate": 1.5000000000000002e-07, "loss": 56.19, "step": 3 }, { "epoch": 0.0028735632183908046, "loss_full_dim": 28.14714241027832, "loss_main": 56.606781005859375, "loss_parscale": 56.5, "loss_sub_dim": 28.459636688232422, "loss_vclub": 1.9073486328125e-06, "parscale_sim": 0.9921875, "step": 3 }, { "epoch": 0.0038314176245210726, "grad_norm": 486.32244873046875, "learning_rate": 2.0000000000000002e-07, "loss": 56.6068, "step": 4 }, { "epoch": 0.0038314176245210726, "loss_full_dim": 26.707256317138672, "loss_main": 53.7358283996582, "loss_parscale": 53.5, "loss_sub_dim": 27.02857208251953, "loss_vclub": 2.288818359375e-05, "parscale_sim": 0.9921875, "step": 4 }, { "epoch": 0.004789272030651341, "grad_norm": 308.9286804199219, "learning_rate": 2.5000000000000004e-07, "loss": 53.7358, "step": 5 }, { "epoch": 0.004789272030651341, "loss_full_dim": 24.470537185668945, "loss_main": 49.20744323730469, "loss_parscale": 49.0, "loss_sub_dim": 24.73690414428711, "loss_vclub": 5.7220458984375e-06, "parscale_sim": 0.98828125, "step": 5 }, { "epoch": 0.005747126436781609, "grad_norm": 361.45697021484375, "learning_rate": 3.0000000000000004e-07, "loss": 49.2074, "step": 6 }, { "epoch": 0.005747126436781609, "loss_full_dim": 20.486265182495117, "loss_main": 41.32176971435547, "loss_parscale": 41.0, "loss_sub_dim": 20.83550262451172, "loss_vclub": 1.33514404296875e-05, "parscale_sim": 0.9921875, "step": 6 }, { "epoch": 0.006704980842911878, "grad_norm": 489.876708984375, "learning_rate": 3.5000000000000004e-07, "loss": 41.3218, "step": 7 }, { "epoch": 0.006704980842911878, "loss_full_dim": 17.867464065551758, "loss_main": 36.07404327392578, "loss_parscale": 36.0, "loss_sub_dim": 18.206579208374023, "loss_vclub": -7.62939453125e-06, "parscale_sim": 0.984375, "step": 7 }, { "epoch": 0.007662835249042145, "grad_norm": 351.1166687011719, "learning_rate": 4.0000000000000003e-07, "loss": 36.074, "step": 8 }, { "epoch": 0.007662835249042145, "loss_full_dim": 13.883452415466309, "loss_main": 28.13947296142578, "loss_parscale": 28.25, "loss_sub_dim": 14.256021499633789, "loss_vclub": 1.52587890625e-05, "parscale_sim": 0.98828125, "step": 8 }, { "epoch": 0.008620689655172414, "grad_norm": 273.4085693359375, "learning_rate": 4.5000000000000003e-07, "loss": 28.1395, "step": 9 }, { "epoch": 0.008620689655172414, "loss_full_dim": 11.522775650024414, "loss_main": 23.46347427368164, "loss_parscale": 23.375, "loss_sub_dim": 11.940699577331543, "loss_vclub": -1.33514404296875e-05, "parscale_sim": 0.984375, "step": 9 }, { "epoch": 0.009578544061302681, "grad_norm": 383.85888671875, "learning_rate": 5.000000000000001e-07, "loss": 23.4635, "step": 10 }, { "epoch": 0.009578544061302681, "loss_full_dim": 9.43447494506836, "loss_main": 19.322315216064453, "loss_parscale": 19.25, "loss_sub_dim": 9.887840270996094, "loss_vclub": -1.1444091796875e-05, "parscale_sim": 0.98828125, "step": 10 }, { "epoch": 0.01053639846743295, "grad_norm": 276.31646728515625, "learning_rate": 5.5e-07, "loss": 19.3223, "step": 11 }, { "epoch": 0.01053639846743295, "loss_full_dim": 8.171350479125977, "loss_main": 16.813720703125, "loss_parscale": 16.75, "loss_sub_dim": 8.642370223999023, "loss_vclub": -3.814697265625e-06, "parscale_sim": 0.97265625, "step": 11 }, { "epoch": 0.011494252873563218, "grad_norm": 759.9069213867188, "learning_rate": 6.000000000000001e-07, "loss": 16.8137, "step": 12 }, { "epoch": 0.011494252873563218, "loss_full_dim": 7.012251853942871, "loss_main": 14.488821029663086, "loss_parscale": 14.5, "loss_sub_dim": 7.476569175720215, "loss_vclub": -3.62396240234375e-05, "parscale_sim": 0.98046875, "step": 12 }, { "epoch": 0.012452107279693486, "grad_norm": 83.51067352294922, "learning_rate": 6.5e-07, "loss": 14.4888, "step": 13 }, { "epoch": 0.012452107279693486, "loss_full_dim": 6.64729642868042, "loss_main": 13.762259483337402, "loss_parscale": 13.75, "loss_sub_dim": 7.114963054656982, "loss_vclub": -5.7220458984375e-06, "parscale_sim": 0.9765625, "step": 13 }, { "epoch": 0.013409961685823755, "grad_norm": 218.7431640625, "learning_rate": 7.000000000000001e-07, "loss": 13.7623, "step": 14 }, { "epoch": 0.013409961685823755, "loss_full_dim": 6.179683685302734, "loss_main": 12.793693542480469, "loss_parscale": 12.8125, "loss_sub_dim": 6.614009380340576, "loss_vclub": 0.0, "parscale_sim": 0.98828125, "step": 14 }, { "epoch": 0.014367816091954023, "grad_norm": 100.04430389404297, "learning_rate": 7.5e-07, "loss": 12.7937, "step": 15 }, { "epoch": 0.014367816091954023, "loss_full_dim": 5.8895697593688965, "loss_main": 12.153852462768555, "loss_parscale": 12.125, "loss_sub_dim": 6.264282703399658, "loss_vclub": -2.09808349609375e-05, "parscale_sim": 0.98828125, "step": 15 }, { "epoch": 0.01532567049808429, "grad_norm": 70.88832092285156, "learning_rate": 8.000000000000001e-07, "loss": 12.1539, "step": 16 }, { "epoch": 0.01532567049808429, "loss_full_dim": 5.517953395843506, "loss_main": 11.450885772705078, "loss_parscale": 11.5, "loss_sub_dim": 5.9329328536987305, "loss_vclub": -5.7220458984375e-06, "parscale_sim": 0.98828125, "step": 16 }, { "epoch": 0.016283524904214558, "grad_norm": 87.37732696533203, "learning_rate": 8.500000000000001e-07, "loss": 11.4509, "step": 17 }, { "epoch": 0.016283524904214558, "loss_full_dim": 6.851534366607666, "loss_main": 14.23066520690918, "loss_parscale": 14.25, "loss_sub_dim": 7.3791303634643555, "loss_vclub": -1.71661376953125e-05, "parscale_sim": 0.98828125, "step": 17 }, { "epoch": 0.017241379310344827, "grad_norm": 50.55602264404297, "learning_rate": 9.000000000000001e-07, "loss": 14.2307, "step": 18 }, { "epoch": 0.017241379310344827, "loss_full_dim": 5.348215579986572, "loss_main": 11.100927352905273, "loss_parscale": 11.125, "loss_sub_dim": 5.752711296081543, "loss_vclub": -1.9073486328125e-06, "parscale_sim": 0.98828125, "step": 18 }, { "epoch": 0.018199233716475097, "grad_norm": 58.99557876586914, "learning_rate": 9.500000000000001e-07, "loss": 11.1009, "step": 19 }, { "epoch": 0.018199233716475097, "loss_full_dim": 4.931085586547852, "loss_main": 10.222579956054688, "loss_parscale": 10.25, "loss_sub_dim": 5.291494369506836, "loss_vclub": 0.0, "parscale_sim": 0.98828125, "step": 19 }, { "epoch": 0.019157088122605363, "grad_norm": 116.5761489868164, "learning_rate": 1.0000000000000002e-06, "loss": 10.2226, "step": 20 }, { "epoch": 0.019157088122605363, "loss_full_dim": 4.620007514953613, "loss_main": 9.643980026245117, "loss_parscale": 9.6875, "loss_sub_dim": 5.023972511291504, "loss_vclub": -1.33514404296875e-05, "parscale_sim": 0.98828125, "step": 20 }, { "epoch": 0.020114942528735632, "grad_norm": 74.11045837402344, "learning_rate": 1.0500000000000001e-06, "loss": 9.644, "step": 21 }, { "epoch": 0.020114942528735632, "loss_full_dim": 4.429300308227539, "loss_main": 9.1763334274292, "loss_parscale": 9.25, "loss_sub_dim": 4.74703311920166, "loss_vclub": 1.33514404296875e-05, "parscale_sim": 0.98828125, "step": 21 }, { "epoch": 0.0210727969348659, "grad_norm": 2042.98095703125, "learning_rate": 1.1e-06, "loss": 9.1763, "step": 22 }, { "epoch": 0.0210727969348659, "loss_full_dim": 4.503853797912598, "loss_main": 9.423707962036133, "loss_parscale": 9.375, "loss_sub_dim": 4.919854164123535, "loss_vclub": -1.1444091796875e-05, "parscale_sim": 0.9921875, "step": 22 }, { "epoch": 0.022030651340996167, "grad_norm": 163.77296447753906, "learning_rate": 1.1500000000000002e-06, "loss": 9.4237, "step": 23 }, { "epoch": 0.022030651340996167, "loss_full_dim": 4.1338605880737305, "loss_main": 8.546049118041992, "loss_parscale": 8.625, "loss_sub_dim": 4.412188529968262, "loss_vclub": 1.52587890625e-05, "parscale_sim": 0.98828125, "step": 23 }, { "epoch": 0.022988505747126436, "grad_norm": 52.15481185913086, "learning_rate": 1.2000000000000002e-06, "loss": 8.546, "step": 24 }, { "epoch": 0.022988505747126436, "loss_full_dim": 3.992586135864258, "loss_main": 8.315573692321777, "loss_parscale": 8.3125, "loss_sub_dim": 4.3229875564575195, "loss_vclub": 1.9073486328125e-06, "parscale_sim": 0.984375, "step": 24 }, { "epoch": 0.023946360153256706, "grad_norm": 66.11255645751953, "learning_rate": 1.25e-06, "loss": 8.3156, "step": 25 }, { "epoch": 0.023946360153256706, "loss_full_dim": 3.771688461303711, "loss_main": 7.815267562866211, "loss_parscale": 7.84375, "loss_sub_dim": 4.0435791015625, "loss_vclub": 1.33514404296875e-05, "parscale_sim": 0.9921875, "step": 25 }, { "epoch": 0.02490421455938697, "grad_norm": 48.1490364074707, "learning_rate": 1.3e-06, "loss": 7.8153, "step": 26 }, { "epoch": 0.02490421455938697, "loss_full_dim": 3.4067771434783936, "loss_main": 7.096142768859863, "loss_parscale": 7.125, "loss_sub_dim": 3.6893653869628906, "loss_vclub": -1.52587890625e-05, "parscale_sim": 0.9921875, "step": 26 }, { "epoch": 0.02586206896551724, "grad_norm": 61.00373077392578, "learning_rate": 1.3500000000000002e-06, "loss": 7.0961, "step": 27 }, { "epoch": 0.02586206896551724, "loss_full_dim": 3.28936767578125, "loss_main": 6.858680248260498, "loss_parscale": 6.84375, "loss_sub_dim": 3.569312572479248, "loss_vclub": 1.9073486328125e-06, "parscale_sim": 0.9921875, "step": 27 }, { "epoch": 0.02681992337164751, "grad_norm": 89.91880798339844, "learning_rate": 1.4000000000000001e-06, "loss": 6.8587, "step": 28 }, { "epoch": 0.02681992337164751, "loss_full_dim": 2.914330005645752, "loss_main": 6.075565338134766, "loss_parscale": 6.09375, "loss_sub_dim": 3.1612353324890137, "loss_vclub": 9.5367431640625e-06, "parscale_sim": 0.9921875, "step": 28 }, { "epoch": 0.027777777777777776, "grad_norm": 59.84787368774414, "learning_rate": 1.45e-06, "loss": 6.0756, "step": 29 }, { "epoch": 0.027777777777777776, "loss_full_dim": 2.7523744106292725, "loss_main": 5.759920120239258, "loss_parscale": 5.75, "loss_sub_dim": 3.0075454711914062, "loss_vclub": 0.0, "parscale_sim": 0.9921875, "step": 29 }, { "epoch": 0.028735632183908046, "grad_norm": 47.231781005859375, "learning_rate": 1.5e-06, "loss": 5.7599, "step": 30 }, { "epoch": 0.028735632183908046, "loss_full_dim": 2.622459650039673, "loss_main": 5.464348793029785, "loss_parscale": 5.5, "loss_sub_dim": 2.8418893814086914, "loss_vclub": -1.9073486328125e-06, "parscale_sim": 0.99609375, "step": 30 }, { "epoch": 0.029693486590038315, "grad_norm": 35.271400451660156, "learning_rate": 1.5500000000000002e-06, "loss": 5.4643, "step": 31 }, { "epoch": 0.029693486590038315, "loss_full_dim": 2.559330940246582, "loss_main": 5.3209991455078125, "loss_parscale": 5.34375, "loss_sub_dim": 2.7616679668426514, "loss_vclub": -1.1444091796875e-05, "parscale_sim": 0.9921875, "step": 31 }, { "epoch": 0.03065134099616858, "grad_norm": 58.45293045043945, "learning_rate": 1.6000000000000001e-06, "loss": 5.321, "step": 32 }, { "epoch": 0.03065134099616858, "loss_full_dim": 2.249798536300659, "loss_main": 4.727456092834473, "loss_parscale": 4.75, "loss_sub_dim": 2.4776573181152344, "loss_vclub": 5.7220458984375e-06, "parscale_sim": 0.9921875, "step": 32 }, { "epoch": 0.031609195402298854, "grad_norm": 30.55335235595703, "learning_rate": 1.6500000000000003e-06, "loss": 4.7275, "step": 33 }, { "epoch": 0.031609195402298854, "loss_full_dim": 2.3825879096984863, "loss_main": 4.949170112609863, "loss_parscale": 4.9375, "loss_sub_dim": 2.566582441329956, "loss_vclub": 1.71661376953125e-05, "parscale_sim": 0.9921875, "step": 33 }, { "epoch": 0.032567049808429116, "grad_norm": 34.073036193847656, "learning_rate": 1.7000000000000002e-06, "loss": 4.9492, "step": 34 }, { "epoch": 0.032567049808429116, "loss_full_dim": 2.236292839050293, "loss_main": 4.68814754486084, "loss_parscale": 4.6875, "loss_sub_dim": 2.451854944229126, "loss_vclub": 9.5367431640625e-06, "parscale_sim": 0.984375, "step": 34 }, { "epoch": 0.033524904214559385, "grad_norm": 88.35596466064453, "learning_rate": 1.75e-06, "loss": 4.6881, "step": 35 }, { "epoch": 0.033524904214559385, "loss_full_dim": 2.186997890472412, "loss_main": 4.557934284210205, "loss_parscale": 4.5625, "loss_sub_dim": 2.370936393737793, "loss_vclub": 2.288818359375e-05, "parscale_sim": 0.99609375, "step": 35 }, { "epoch": 0.034482758620689655, "grad_norm": 39.36273193359375, "learning_rate": 1.8000000000000001e-06, "loss": 4.5579, "step": 36 }, { "epoch": 0.034482758620689655, "loss_full_dim": 2.320162057876587, "loss_main": 4.802684783935547, "loss_parscale": 4.8125, "loss_sub_dim": 2.482522964477539, "loss_vclub": 2.09808349609375e-05, "parscale_sim": 0.9921875, "step": 36 }, { "epoch": 0.035440613026819924, "grad_norm": 27.575183868408203, "learning_rate": 1.85e-06, "loss": 4.8027, "step": 37 }, { "epoch": 0.035440613026819924, "loss_full_dim": 3.195054054260254, "loss_main": 6.606266975402832, "loss_parscale": 6.625, "loss_sub_dim": 3.4112131595611572, "loss_vclub": -1.71661376953125e-05, "parscale_sim": 0.9921875, "step": 37 }, { "epoch": 0.03639846743295019, "grad_norm": 84.62775421142578, "learning_rate": 1.9000000000000002e-06, "loss": 6.6063, "step": 38 }, { "epoch": 0.03639846743295019, "loss_full_dim": 1.9547231197357178, "loss_main": 4.088750839233398, "loss_parscale": 4.09375, "loss_sub_dim": 2.1340279579162598, "loss_vclub": 2.09808349609375e-05, "parscale_sim": 0.98828125, "step": 38 }, { "epoch": 0.03735632183908046, "grad_norm": 38.074546813964844, "learning_rate": 1.9500000000000004e-06, "loss": 4.0888, "step": 39 }, { "epoch": 0.03735632183908046, "loss_full_dim": 2.0766727924346924, "loss_main": 4.309389114379883, "loss_parscale": 4.3125, "loss_sub_dim": 2.2327165603637695, "loss_vclub": -5.7220458984375e-06, "parscale_sim": 0.984375, "step": 39 }, { "epoch": 0.038314176245210725, "grad_norm": 46.0982666015625, "learning_rate": 2.0000000000000003e-06, "loss": 4.3094, "step": 40 }, { "epoch": 0.038314176245210725, "loss_full_dim": 1.9581432342529297, "loss_main": 4.081917762756348, "loss_parscale": 4.0625, "loss_sub_dim": 2.123774290084839, "loss_vclub": -9.5367431640625e-06, "parscale_sim": 0.99609375, "step": 40 }, { "epoch": 0.039272030651340994, "grad_norm": 39.8221435546875, "learning_rate": 2.05e-06, "loss": 4.0819, "step": 41 }, { "epoch": 0.039272030651340994, "loss_full_dim": 1.7684195041656494, "loss_main": 3.7132532596588135, "loss_parscale": 3.75, "loss_sub_dim": 1.944833755493164, "loss_vclub": 5.7220458984375e-06, "parscale_sim": 0.9921875, "step": 41 }, { "epoch": 0.040229885057471264, "grad_norm": 38.747894287109375, "learning_rate": 2.1000000000000002e-06, "loss": 3.7133, "step": 42 }, { "epoch": 0.040229885057471264, "loss_full_dim": 1.9075413942337036, "loss_main": 3.9601874351501465, "loss_parscale": 3.953125, "loss_sub_dim": 2.0526459217071533, "loss_vclub": 3.4332275390625e-05, "parscale_sim": 0.98828125, "step": 42 }, { "epoch": 0.04118773946360153, "grad_norm": 28.218534469604492, "learning_rate": 2.15e-06, "loss": 3.9602, "step": 43 }, { "epoch": 0.04118773946360153, "loss_full_dim": 1.8397352695465088, "loss_main": 3.843639612197876, "loss_parscale": 3.84375, "loss_sub_dim": 2.003904342651367, "loss_vclub": 2.6702880859375e-05, "parscale_sim": 0.9921875, "step": 43 }, { "epoch": 0.0421455938697318, "grad_norm": 36.979461669921875, "learning_rate": 2.2e-06, "loss": 3.8436, "step": 44 }, { "epoch": 0.0421455938697318, "loss_full_dim": 1.7193338871002197, "loss_main": 3.568979263305664, "loss_parscale": 3.5625, "loss_sub_dim": 1.8496453762054443, "loss_vclub": 1.9073486328125e-05, "parscale_sim": 0.9921875, "step": 44 }, { "epoch": 0.04310344827586207, "grad_norm": 28.82156753540039, "learning_rate": 2.25e-06, "loss": 3.569, "step": 45 }, { "epoch": 0.04310344827586207, "loss_full_dim": 1.6388003826141357, "loss_main": 3.394000291824341, "loss_parscale": 3.390625, "loss_sub_dim": 1.755199909210205, "loss_vclub": -3.814697265625e-06, "parscale_sim": 0.9921875, "step": 45 }, { "epoch": 0.044061302681992334, "grad_norm": 26.69896697998047, "learning_rate": 2.3000000000000004e-06, "loss": 3.394, "step": 46 }, { "epoch": 0.044061302681992334, "loss_full_dim": 1.6422910690307617, "loss_main": 3.403944492340088, "loss_parscale": 3.421875, "loss_sub_dim": 1.7616533041000366, "loss_vclub": 3.62396240234375e-05, "parscale_sim": 0.984375, "step": 46 }, { "epoch": 0.045019157088122604, "grad_norm": 26.755311965942383, "learning_rate": 2.35e-06, "loss": 3.4039, "step": 47 }, { "epoch": 0.045019157088122604, "loss_full_dim": 1.5500622987747192, "loss_main": 3.2283248901367188, "loss_parscale": 3.25, "loss_sub_dim": 1.67826247215271, "loss_vclub": -2.6702880859375e-05, "parscale_sim": 0.9921875, "step": 47 }, { "epoch": 0.04597701149425287, "grad_norm": 26.591873168945312, "learning_rate": 2.4000000000000003e-06, "loss": 3.2283, "step": 48 }, { "epoch": 0.04597701149425287, "loss_full_dim": 1.6151713132858276, "loss_main": 3.342273235321045, "loss_parscale": 3.3125, "loss_sub_dim": 1.7271019220352173, "loss_vclub": 5.7220458984375e-06, "parscale_sim": 0.9921875, "step": 48 }, { "epoch": 0.04693486590038314, "grad_norm": 23.952716827392578, "learning_rate": 2.4500000000000003e-06, "loss": 3.3423, "step": 49 }, { "epoch": 0.04693486590038314, "loss_full_dim": 1.5720106363296509, "loss_main": 3.262500762939453, "loss_parscale": 3.28125, "loss_sub_dim": 1.6904902458190918, "loss_vclub": 5.7220458984375e-06, "parscale_sim": 0.9921875, "step": 49 }, { "epoch": 0.04789272030651341, "grad_norm": 35.36857986450195, "learning_rate": 2.5e-06, "loss": 3.2625, "step": 50 }, { "epoch": 0.04789272030651341, "loss_full_dim": 1.7535868883132935, "loss_main": 3.637054920196533, "loss_parscale": 3.609375, "loss_sub_dim": 1.8834681510925293, "loss_vclub": -1.9073486328125e-06, "parscale_sim": 0.984375, "step": 50 }, { "epoch": 0.04885057471264368, "grad_norm": 31.500146865844727, "learning_rate": 2.55e-06, "loss": 3.6371, "step": 51 }, { "epoch": 0.04885057471264368, "loss_full_dim": 1.5265578031539917, "loss_main": 3.1539828777313232, "loss_parscale": 3.15625, "loss_sub_dim": 1.6274250745773315, "loss_vclub": 3.0517578125e-05, "parscale_sim": 0.98046875, "step": 51 }, { "epoch": 0.04980842911877394, "grad_norm": 46.449588775634766, "learning_rate": 2.6e-06, "loss": 3.154, "step": 52 }, { "epoch": 0.04980842911877394, "loss_full_dim": 1.515243411064148, "loss_main": 3.142493724822998, "loss_parscale": 3.125, "loss_sub_dim": 1.6272501945495605, "loss_vclub": 0.0, "parscale_sim": 0.9921875, "step": 52 }, { "epoch": 0.05076628352490421, "grad_norm": 29.402326583862305, "learning_rate": 2.6500000000000005e-06, "loss": 3.1425, "step": 53 }, { "epoch": 0.05076628352490421, "loss_full_dim": 1.302185297012329, "loss_main": 2.711179256439209, "loss_parscale": 2.71875, "loss_sub_dim": 1.4089940786361694, "loss_vclub": 3.4332275390625e-05, "parscale_sim": 0.98046875, "step": 53 }, { "epoch": 0.05172413793103448, "grad_norm": 21.509185791015625, "learning_rate": 2.7000000000000004e-06, "loss": 2.7112, "step": 54 }, { "epoch": 0.05172413793103448, "loss_full_dim": 1.3309576511383057, "loss_main": 2.7577123641967773, "loss_parscale": 2.75, "loss_sub_dim": 1.4267548322677612, "loss_vclub": 2.86102294921875e-05, "parscale_sim": 0.984375, "step": 54 }, { "epoch": 0.05268199233716475, "grad_norm": 21.17945671081543, "learning_rate": 2.7500000000000004e-06, "loss": 2.7577, "step": 55 }, { "epoch": 0.05268199233716475, "loss_full_dim": 1.2117403745651245, "loss_main": 2.514101982116699, "loss_parscale": 2.5, "loss_sub_dim": 1.3023617267608643, "loss_vclub": 5.7220458984375e-06, "parscale_sim": 0.9921875, "step": 55 }, { "epoch": 0.05363984674329502, "grad_norm": 96.6557846069336, "learning_rate": 2.8000000000000003e-06, "loss": 2.5141, "step": 56 }, { "epoch": 0.05363984674329502, "loss_full_dim": 1.2082308530807495, "loss_main": 2.4996585845947266, "loss_parscale": 2.5, "loss_sub_dim": 1.2914276123046875, "loss_vclub": 3.0517578125e-05, "parscale_sim": 0.9921875, "step": 56 }, { "epoch": 0.05459770114942529, "grad_norm": 97.51107788085938, "learning_rate": 2.85e-06, "loss": 2.4997, "step": 57 }, { "epoch": 0.05459770114942529, "loss_full_dim": 1.2508951425552368, "loss_main": 2.597651720046997, "loss_parscale": 2.59375, "loss_sub_dim": 1.3467565774917603, "loss_vclub": 1.52587890625e-05, "parscale_sim": 0.9921875, "step": 57 }, { "epoch": 0.05555555555555555, "grad_norm": 19.01352310180664, "learning_rate": 2.9e-06, "loss": 2.5977, "step": 58 }, { "epoch": 0.05555555555555555, "loss_full_dim": 1.233282446861267, "loss_main": 2.547071695327759, "loss_parscale": 2.546875, "loss_sub_dim": 1.3137892484664917, "loss_vclub": 5.7220458984375e-06, "parscale_sim": 0.98828125, "step": 58 }, { "epoch": 0.05651340996168582, "grad_norm": 30.410297393798828, "learning_rate": 2.95e-06, "loss": 2.5471, "step": 59 }, { "epoch": 0.05651340996168582, "loss_full_dim": 1.2544177770614624, "loss_main": 2.5948238372802734, "loss_parscale": 2.59375, "loss_sub_dim": 1.3404061794281006, "loss_vclub": 3.814697265625e-05, "parscale_sim": 0.99609375, "step": 59 }, { "epoch": 0.05747126436781609, "grad_norm": 26.40641212463379, "learning_rate": 3e-06, "loss": 2.5948, "step": 60 }, { "epoch": 0.05747126436781609, "loss_full_dim": 1.227527379989624, "loss_main": 2.5344841480255127, "loss_parscale": 2.53125, "loss_sub_dim": 1.3069567680358887, "loss_vclub": 3.0517578125e-05, "parscale_sim": 0.9921875, "step": 60 }, { "epoch": 0.05842911877394636, "grad_norm": 19.4179744720459, "learning_rate": 3.05e-06, "loss": 2.5345, "step": 61 }, { "epoch": 0.05842911877394636, "loss_full_dim": 1.1664669513702393, "loss_main": 2.42323637008667, "loss_parscale": 2.40625, "loss_sub_dim": 1.2567694187164307, "loss_vclub": 5.14984130859375e-05, "parscale_sim": 0.9921875, "step": 61 }, { "epoch": 0.05938697318007663, "grad_norm": 33.37090301513672, "learning_rate": 3.1000000000000004e-06, "loss": 2.4232, "step": 62 }, { "epoch": 0.05938697318007663, "loss_full_dim": 1.33584463596344, "loss_main": 2.7449498176574707, "loss_parscale": 2.75, "loss_sub_dim": 1.4091050624847412, "loss_vclub": 1.71661376953125e-05, "parscale_sim": 0.9921875, "step": 62 }, { "epoch": 0.0603448275862069, "grad_norm": 26.98957633972168, "learning_rate": 3.1500000000000003e-06, "loss": 2.7449, "step": 63 }, { "epoch": 0.0603448275862069, "loss_full_dim": 1.1889444589614868, "loss_main": 2.4392547607421875, "loss_parscale": 2.4375, "loss_sub_dim": 1.2503103017807007, "loss_vclub": 4.00543212890625e-05, "parscale_sim": 0.98828125, "step": 63 }, { "epoch": 0.06130268199233716, "grad_norm": 20.963672637939453, "learning_rate": 3.2000000000000003e-06, "loss": 2.4393, "step": 64 }, { "epoch": 0.06130268199233716, "loss_full_dim": 1.086988925933838, "loss_main": 2.2535557746887207, "loss_parscale": 2.265625, "loss_sub_dim": 1.1665667295455933, "loss_vclub": 1.9073486328125e-05, "parscale_sim": 0.9921875, "step": 64 }, { "epoch": 0.06226053639846743, "grad_norm": 29.975191116333008, "learning_rate": 3.2500000000000002e-06, "loss": 2.2536, "step": 65 }, { "epoch": 0.06226053639846743, "loss_full_dim": 1.1808075904846191, "loss_main": 2.439089298248291, "loss_parscale": 2.46875, "loss_sub_dim": 1.2582818269729614, "loss_vclub": 2.47955322265625e-05, "parscale_sim": 0.98828125, "step": 65 }, { "epoch": 0.06321839080459771, "grad_norm": 24.438688278198242, "learning_rate": 3.3000000000000006e-06, "loss": 2.4391, "step": 66 }, { "epoch": 0.06321839080459771, "loss_full_dim": 1.1956560611724854, "loss_main": 2.4795889854431152, "loss_parscale": 2.46875, "loss_sub_dim": 1.2839329242706299, "loss_vclub": 5.7220458984375e-06, "parscale_sim": 0.98828125, "step": 66 }, { "epoch": 0.06417624521072797, "grad_norm": 37.03203201293945, "learning_rate": 3.3500000000000005e-06, "loss": 2.4796, "step": 67 }, { "epoch": 0.06417624521072797, "loss_full_dim": 1.094626784324646, "loss_main": 2.2590057849884033, "loss_parscale": 2.25, "loss_sub_dim": 1.1643790006637573, "loss_vclub": 2.288818359375e-05, "parscale_sim": 0.9921875, "step": 67 }, { "epoch": 0.06513409961685823, "grad_norm": 24.15251922607422, "learning_rate": 3.4000000000000005e-06, "loss": 2.259, "step": 68 }, { "epoch": 0.06513409961685823, "loss_full_dim": 1.068907380104065, "loss_main": 2.199707508087158, "loss_parscale": 2.21875, "loss_sub_dim": 1.1308002471923828, "loss_vclub": 5.340576171875e-05, "parscale_sim": 0.98828125, "step": 68 }, { "epoch": 0.06609195402298851, "grad_norm": 21.34566879272461, "learning_rate": 3.45e-06, "loss": 2.1997, "step": 69 }, { "epoch": 0.06609195402298851, "loss_full_dim": 0.9918674230575562, "loss_main": 2.050957679748535, "loss_parscale": 2.046875, "loss_sub_dim": 1.0590901374816895, "loss_vclub": 3.62396240234375e-05, "parscale_sim": 0.9921875, "step": 69 }, { "epoch": 0.06704980842911877, "grad_norm": 17.175941467285156, "learning_rate": 3.5e-06, "loss": 2.051, "step": 70 }, { "epoch": 0.06704980842911877, "loss_full_dim": 1.0565348863601685, "loss_main": 2.176116943359375, "loss_parscale": 2.1875, "loss_sub_dim": 1.119581937789917, "loss_vclub": 4.9591064453125e-05, "parscale_sim": 0.9921875, "step": 70 }, { "epoch": 0.06800766283524905, "grad_norm": 17.343780517578125, "learning_rate": 3.5500000000000003e-06, "loss": 2.1761, "step": 71 }, { "epoch": 0.06800766283524905, "loss_full_dim": 0.922068178653717, "loss_main": 1.9063405990600586, "loss_parscale": 1.90625, "loss_sub_dim": 0.9842724800109863, "loss_vclub": 3.814697265625e-05, "parscale_sim": 0.9921875, "step": 71 }, { "epoch": 0.06896551724137931, "grad_norm": 17.621437072753906, "learning_rate": 3.6000000000000003e-06, "loss": 1.9063, "step": 72 }, { "epoch": 0.06896551724137931, "loss_full_dim": 0.9338617324829102, "loss_main": 1.9262635707855225, "loss_parscale": 1.921875, "loss_sub_dim": 0.9924018383026123, "loss_vclub": 6.4849853515625e-05, "parscale_sim": 0.9921875, "step": 72 }, { "epoch": 0.06992337164750957, "grad_norm": 19.96275520324707, "learning_rate": 3.65e-06, "loss": 1.9263, "step": 73 }, { "epoch": 0.06992337164750957, "loss_full_dim": 0.9866521954536438, "loss_main": 2.025604724884033, "loss_parscale": 2.046875, "loss_sub_dim": 1.0389525890350342, "loss_vclub": 5.91278076171875e-05, "parscale_sim": 0.9921875, "step": 73 }, { "epoch": 0.07088122605363985, "grad_norm": 16.729263305664062, "learning_rate": 3.7e-06, "loss": 2.0256, "step": 74 }, { "epoch": 0.07088122605363985, "loss_full_dim": 0.903300404548645, "loss_main": 1.8610045909881592, "loss_parscale": 1.859375, "loss_sub_dim": 0.9577041864395142, "loss_vclub": 2.6702880859375e-05, "parscale_sim": 0.9921875, "step": 74 }, { "epoch": 0.07183908045977011, "grad_norm": 19.866695404052734, "learning_rate": 3.7500000000000005e-06, "loss": 1.861, "step": 75 }, { "epoch": 0.07183908045977011, "loss_full_dim": 0.9628086686134338, "loss_main": 1.9816994667053223, "loss_parscale": 1.984375, "loss_sub_dim": 1.0188908576965332, "loss_vclub": 4.38690185546875e-05, "parscale_sim": 0.9921875, "step": 75 }, { "epoch": 0.07279693486590039, "grad_norm": 20.1734561920166, "learning_rate": 3.8000000000000005e-06, "loss": 1.9817, "step": 76 }, { "epoch": 0.07279693486590039, "loss_full_dim": 0.9500946998596191, "loss_main": 1.9420944452285767, "loss_parscale": 1.9453125, "loss_sub_dim": 0.9919997453689575, "loss_vclub": 4.00543212890625e-05, "parscale_sim": 0.98828125, "step": 76 }, { "epoch": 0.07375478927203065, "grad_norm": 15.909680366516113, "learning_rate": 3.85e-06, "loss": 1.9421, "step": 77 }, { "epoch": 0.07375478927203065, "loss_full_dim": 0.922800600528717, "loss_main": 1.896266222000122, "loss_parscale": 1.8984375, "loss_sub_dim": 0.9734656810760498, "loss_vclub": 4.00543212890625e-05, "parscale_sim": 0.9921875, "step": 77 }, { "epoch": 0.07471264367816093, "grad_norm": 21.93893814086914, "learning_rate": 3.900000000000001e-06, "loss": 1.8963, "step": 78 }, { "epoch": 0.07471264367816093, "loss_full_dim": 0.9844490885734558, "loss_main": 2.023993730545044, "loss_parscale": 2.03125, "loss_sub_dim": 1.0395445823669434, "loss_vclub": 8.58306884765625e-05, "parscale_sim": 0.9921875, "step": 78 }, { "epoch": 0.07567049808429119, "grad_norm": 14.004870414733887, "learning_rate": 3.95e-06, "loss": 2.024, "step": 79 }, { "epoch": 0.07567049808429119, "loss_full_dim": 0.8736144304275513, "loss_main": 1.7916176319122314, "loss_parscale": 1.78125, "loss_sub_dim": 0.9180032014846802, "loss_vclub": 2.47955322265625e-05, "parscale_sim": 0.9921875, "step": 79 }, { "epoch": 0.07662835249042145, "grad_norm": 14.889060020446777, "learning_rate": 4.000000000000001e-06, "loss": 1.7916, "step": 80 }, { "epoch": 0.07662835249042145, "loss_full_dim": 0.972407877445221, "loss_main": 1.99755859375, "loss_parscale": 2.015625, "loss_sub_dim": 1.0251506567001343, "loss_vclub": 4.00543212890625e-05, "parscale_sim": 0.9921875, "step": 80 }, { "epoch": 0.07758620689655173, "grad_norm": 12.796154975891113, "learning_rate": 4.05e-06, "loss": 1.9976, "step": 81 }, { "epoch": 0.07758620689655173, "loss_full_dim": 0.8467214107513428, "loss_main": 1.7426525354385376, "loss_parscale": 1.75, "loss_sub_dim": 0.8959311246871948, "loss_vclub": 7.2479248046875e-05, "parscale_sim": 0.99609375, "step": 81 }, { "epoch": 0.07854406130268199, "grad_norm": 14.5369291305542, "learning_rate": 4.1e-06, "loss": 1.7427, "step": 82 }, { "epoch": 0.07854406130268199, "loss_full_dim": 0.9794785976409912, "loss_main": 2.012943983078003, "loss_parscale": 2.03125, "loss_sub_dim": 1.0334653854370117, "loss_vclub": 6.29425048828125e-05, "parscale_sim": 0.9921875, "step": 82 }, { "epoch": 0.07950191570881227, "grad_norm": 20.860658645629883, "learning_rate": 4.15e-06, "loss": 2.0129, "step": 83 }, { "epoch": 0.07950191570881227, "loss_full_dim": 0.834812581539154, "loss_main": 1.724219799041748, "loss_parscale": 1.71875, "loss_sub_dim": 0.889407217502594, "loss_vclub": 6.29425048828125e-05, "parscale_sim": 0.9921875, "step": 83 }, { "epoch": 0.08045977011494253, "grad_norm": 15.067578315734863, "learning_rate": 4.2000000000000004e-06, "loss": 1.7242, "step": 84 }, { "epoch": 0.08045977011494253, "loss_full_dim": 0.9339824318885803, "loss_main": 1.9146215915679932, "loss_parscale": 1.90625, "loss_sub_dim": 0.9806392192840576, "loss_vclub": 7.2479248046875e-05, "parscale_sim": 0.9921875, "step": 84 }, { "epoch": 0.08141762452107279, "grad_norm": 13.93713092803955, "learning_rate": 4.25e-06, "loss": 1.9146, "step": 85 }, { "epoch": 0.08141762452107279, "loss_full_dim": 1.0739879608154297, "loss_main": 2.202474594116211, "loss_parscale": 2.203125, "loss_sub_dim": 1.1284865140914917, "loss_vclub": 7.62939453125e-05, "parscale_sim": 0.98828125, "step": 85 }, { "epoch": 0.08237547892720307, "grad_norm": 12.566777229309082, "learning_rate": 4.3e-06, "loss": 2.2025, "step": 86 }, { "epoch": 0.08237547892720307, "loss_full_dim": 0.943613588809967, "loss_main": 1.9370012283325195, "loss_parscale": 1.9375, "loss_sub_dim": 0.9933876991271973, "loss_vclub": 4.57763671875e-05, "parscale_sim": 0.9921875, "step": 86 }, { "epoch": 0.08333333333333333, "grad_norm": 108.27618408203125, "learning_rate": 4.350000000000001e-06, "loss": 1.937, "step": 87 }, { "epoch": 0.08333333333333333, "loss_full_dim": 0.9043827652931213, "loss_main": 1.853740930557251, "loss_parscale": 1.828125, "loss_sub_dim": 0.9493582248687744, "loss_vclub": 7.62939453125e-06, "parscale_sim": 0.9921875, "step": 87 }, { "epoch": 0.0842911877394636, "grad_norm": 14.024806022644043, "learning_rate": 4.4e-06, "loss": 1.8537, "step": 88 }, { "epoch": 0.0842911877394636, "loss_full_dim": 0.8512803912162781, "loss_main": 1.7433929443359375, "loss_parscale": 1.75, "loss_sub_dim": 0.8921125531196594, "loss_vclub": 4.76837158203125e-05, "parscale_sim": 0.9921875, "step": 88 }, { "epoch": 0.08524904214559387, "grad_norm": 18.250303268432617, "learning_rate": 4.450000000000001e-06, "loss": 1.7434, "step": 89 }, { "epoch": 0.08524904214559387, "loss_full_dim": 0.8732202053070068, "loss_main": 1.7870060205459595, "loss_parscale": 1.78125, "loss_sub_dim": 0.9137858152389526, "loss_vclub": 5.340576171875e-05, "parscale_sim": 0.9921875, "step": 89 }, { "epoch": 0.08620689655172414, "grad_norm": 14.250292778015137, "learning_rate": 4.5e-06, "loss": 1.787, "step": 90 }, { "epoch": 0.08620689655172414, "loss_full_dim": 0.8922809362411499, "loss_main": 1.8292337656021118, "loss_parscale": 1.8359375, "loss_sub_dim": 0.9369528293609619, "loss_vclub": 0.0001068115234375, "parscale_sim": 0.9921875, "step": 90 }, { "epoch": 0.0871647509578544, "grad_norm": 22.04933738708496, "learning_rate": 4.5500000000000005e-06, "loss": 1.8292, "step": 91 }, { "epoch": 0.0871647509578544, "loss_full_dim": 0.7890886664390564, "loss_main": 1.6206588745117188, "loss_parscale": 1.609375, "loss_sub_dim": 0.8315701484680176, "loss_vclub": 0.0001010894775390625, "parscale_sim": 0.9921875, "step": 91 }, { "epoch": 0.08812260536398467, "grad_norm": 12.014373779296875, "learning_rate": 4.600000000000001e-06, "loss": 1.6207, "step": 92 }, { "epoch": 0.08812260536398467, "loss_full_dim": 0.8630169034004211, "loss_main": 1.7684544324874878, "loss_parscale": 1.7578125, "loss_sub_dim": 0.9054375290870667, "loss_vclub": 8.96453857421875e-05, "parscale_sim": 0.984375, "step": 92 }, { "epoch": 0.08908045977011494, "grad_norm": 14.303446769714355, "learning_rate": 4.65e-06, "loss": 1.7685, "step": 93 }, { "epoch": 0.08908045977011494, "loss_full_dim": 0.8983889818191528, "loss_main": 1.8426650762557983, "loss_parscale": 1.859375, "loss_sub_dim": 0.9442760944366455, "loss_vclub": 9.918212890625e-05, "parscale_sim": 0.9921875, "step": 93 }, { "epoch": 0.09003831417624521, "grad_norm": 22.283117294311523, "learning_rate": 4.7e-06, "loss": 1.8427, "step": 94 }, { "epoch": 0.09003831417624521, "loss_full_dim": 0.893531858921051, "loss_main": 1.828042984008789, "loss_parscale": 1.8203125, "loss_sub_dim": 0.9345111846923828, "loss_vclub": 6.29425048828125e-05, "parscale_sim": 0.9921875, "step": 94 }, { "epoch": 0.09099616858237548, "grad_norm": 13.083138465881348, "learning_rate": 4.75e-06, "loss": 1.828, "step": 95 }, { "epoch": 0.09099616858237548, "loss_full_dim": 0.8189941048622131, "loss_main": 1.6827774047851562, "loss_parscale": 1.6875, "loss_sub_dim": 0.8637832403182983, "loss_vclub": 7.43865966796875e-05, "parscale_sim": 0.9921875, "step": 95 }, { "epoch": 0.09195402298850575, "grad_norm": 13.438131332397461, "learning_rate": 4.800000000000001e-06, "loss": 1.6828, "step": 96 }, { "epoch": 0.09195402298850575, "loss_full_dim": 0.8476383686065674, "loss_main": 1.7282662391662598, "loss_parscale": 1.7421875, "loss_sub_dim": 0.8806278109550476, "loss_vclub": 9.72747802734375e-05, "parscale_sim": 0.98828125, "step": 96 }, { "epoch": 0.09291187739463602, "grad_norm": 19.76914405822754, "learning_rate": 4.85e-06, "loss": 1.7283, "step": 97 }, { "epoch": 0.09291187739463602, "loss_full_dim": 0.8239279389381409, "loss_main": 1.6969246864318848, "loss_parscale": 1.6875, "loss_sub_dim": 0.8729968070983887, "loss_vclub": 9.72747802734375e-05, "parscale_sim": 0.9921875, "step": 97 }, { "epoch": 0.09386973180076628, "grad_norm": 18.77296257019043, "learning_rate": 4.9000000000000005e-06, "loss": 1.6969, "step": 98 }, { "epoch": 0.09386973180076628, "loss_full_dim": 0.7481899261474609, "loss_main": 1.5418051481246948, "loss_parscale": 1.5390625, "loss_sub_dim": 0.7936152219772339, "loss_vclub": 0.0001087188720703125, "parscale_sim": 0.98828125, "step": 98 }, { "epoch": 0.09482758620689655, "grad_norm": 13.750653266906738, "learning_rate": 4.95e-06, "loss": 1.5418, "step": 99 }, { "epoch": 0.09482758620689655, "loss_full_dim": 0.8148187398910522, "loss_main": 1.6614495515823364, "loss_parscale": 1.671875, "loss_sub_dim": 0.8466308116912842, "loss_vclub": 9.5367431640625e-05, "parscale_sim": 0.9921875, "step": 99 }, { "epoch": 0.09578544061302682, "grad_norm": 12.095931053161621, "learning_rate": 5e-06, "loss": 1.6614, "step": 100 }, { "epoch": 0.09578544061302682, "loss_full_dim": 0.7543656826019287, "loss_main": 1.544918179512024, "loss_parscale": 1.546875, "loss_sub_dim": 0.7905524969100952, "loss_vclub": 7.82012939453125e-05, "parscale_sim": 0.9921875, "step": 100 }, { "epoch": 0.09674329501915709, "grad_norm": 17.634353637695312, "learning_rate": 4.9973684210526316e-06, "loss": 1.5449, "step": 101 }, { "epoch": 0.09674329501915709, "loss_full_dim": 0.7316312789916992, "loss_main": 1.4998822212219238, "loss_parscale": 1.4921875, "loss_sub_dim": 0.7682509422302246, "loss_vclub": 9.918212890625e-05, "parscale_sim": 0.9921875, "step": 101 }, { "epoch": 0.09770114942528736, "grad_norm": 22.647031784057617, "learning_rate": 4.9947368421052636e-06, "loss": 1.4999, "step": 102 }, { "epoch": 0.09770114942528736, "loss_full_dim": 0.7207196354866028, "loss_main": 1.4751946926116943, "loss_parscale": 1.4765625, "loss_sub_dim": 0.7544751167297363, "loss_vclub": 6.866455078125e-05, "parscale_sim": 0.9921875, "step": 102 }, { "epoch": 0.09865900383141762, "grad_norm": 11.342265129089355, "learning_rate": 4.992105263157896e-06, "loss": 1.4752, "step": 103 }, { "epoch": 0.09865900383141762, "loss_full_dim": 0.7307630777359009, "loss_main": 1.4944946765899658, "loss_parscale": 1.5, "loss_sub_dim": 0.7637315392494202, "loss_vclub": 9.1552734375e-05, "parscale_sim": 0.9921875, "step": 103 }, { "epoch": 0.09961685823754789, "grad_norm": 14.41549015045166, "learning_rate": 4.989473684210527e-06, "loss": 1.4945, "step": 104 }, { "epoch": 0.09961685823754789, "loss_full_dim": 0.7004854679107666, "loss_main": 1.432535171508789, "loss_parscale": 1.421875, "loss_sub_dim": 0.7320497632026672, "loss_vclub": 0.0001125335693359375, "parscale_sim": 0.9921875, "step": 104 }, { "epoch": 0.10057471264367816, "grad_norm": 10.736408233642578, "learning_rate": 4.986842105263158e-06, "loss": 1.4325, "step": 105 }, { "epoch": 0.10057471264367816, "loss_full_dim": 0.6895180344581604, "loss_main": 1.4139559268951416, "loss_parscale": 1.4375, "loss_sub_dim": 0.7244378328323364, "loss_vclub": 8.96453857421875e-05, "parscale_sim": 0.98828125, "step": 105 }, { "epoch": 0.10153256704980843, "grad_norm": 14.084941864013672, "learning_rate": 4.98421052631579e-06, "loss": 1.414, "step": 106 }, { "epoch": 0.10153256704980843, "loss_full_dim": 0.6567285060882568, "loss_main": 1.3421680927276611, "loss_parscale": 1.34375, "loss_sub_dim": 0.6854395270347595, "loss_vclub": 0.0001239776611328125, "parscale_sim": 0.98046875, "step": 106 }, { "epoch": 0.1024904214559387, "grad_norm": 10.690167427062988, "learning_rate": 4.981578947368422e-06, "loss": 1.3422, "step": 107 }, { "epoch": 0.1024904214559387, "loss_full_dim": 0.7029094696044922, "loss_main": 1.4382234811782837, "loss_parscale": 1.453125, "loss_sub_dim": 0.7353140115737915, "loss_vclub": 0.0001392364501953125, "parscale_sim": 0.99609375, "step": 107 }, { "epoch": 0.10344827586206896, "grad_norm": 19.997657775878906, "learning_rate": 4.978947368421053e-06, "loss": 1.4382, "step": 108 }, { "epoch": 0.10344827586206896, "loss_full_dim": 0.7794752717018127, "loss_main": 1.60068678855896, "loss_parscale": 1.609375, "loss_sub_dim": 0.8212114572525024, "loss_vclub": 0.0001373291015625, "parscale_sim": 0.98828125, "step": 108 }, { "epoch": 0.10440613026819924, "grad_norm": 18.109922409057617, "learning_rate": 4.976315789473685e-06, "loss": 1.6007, "step": 109 }, { "epoch": 0.10440613026819924, "loss_full_dim": 0.721717894077301, "loss_main": 1.4776599407196045, "loss_parscale": 1.484375, "loss_sub_dim": 0.7559419870376587, "loss_vclub": 0.0001621246337890625, "parscale_sim": 0.98828125, "step": 109 }, { "epoch": 0.1053639846743295, "grad_norm": 11.94052791595459, "learning_rate": 4.973684210526316e-06, "loss": 1.4777, "step": 110 }, { "epoch": 0.1053639846743295, "loss_full_dim": 0.7945519089698792, "loss_main": 1.627589225769043, "loss_parscale": 1.625, "loss_sub_dim": 0.833037257194519, "loss_vclub": 0.000133514404296875, "parscale_sim": 0.9921875, "step": 110 }, { "epoch": 0.10632183908045977, "grad_norm": 33.03120040893555, "learning_rate": 4.971052631578947e-06, "loss": 1.6276, "step": 111 }, { "epoch": 0.10632183908045977, "loss_full_dim": 0.873437225818634, "loss_main": 1.7834954261779785, "loss_parscale": 1.78125, "loss_sub_dim": 0.9100581407546997, "loss_vclub": 0.000125885009765625, "parscale_sim": 0.9921875, "step": 111 }, { "epoch": 0.10727969348659004, "grad_norm": 12.37429141998291, "learning_rate": 4.968421052631579e-06, "loss": 1.7835, "step": 112 }, { "epoch": 0.10727969348659004, "loss_full_dim": 0.7109987735748291, "loss_main": 1.4560941457748413, "loss_parscale": 1.453125, "loss_sub_dim": 0.7450953722000122, "loss_vclub": 0.000102996826171875, "parscale_sim": 0.9921875, "step": 112 }, { "epoch": 0.1082375478927203, "grad_norm": 12.282116889953613, "learning_rate": 4.965789473684211e-06, "loss": 1.4561, "step": 113 }, { "epoch": 0.1082375478927203, "loss_full_dim": 0.7198029160499573, "loss_main": 1.4745891094207764, "loss_parscale": 1.484375, "loss_sub_dim": 0.7547861337661743, "loss_vclub": 0.00014495849609375, "parscale_sim": 0.9921875, "step": 113 }, { "epoch": 0.10919540229885058, "grad_norm": 11.182510375976562, "learning_rate": 4.9631578947368426e-06, "loss": 1.4746, "step": 114 }, { "epoch": 0.10919540229885058, "loss_full_dim": 0.7248029112815857, "loss_main": 1.4806857109069824, "loss_parscale": 1.484375, "loss_sub_dim": 0.7558828592300415, "loss_vclub": 0.0001373291015625, "parscale_sim": 0.984375, "step": 114 }, { "epoch": 0.11015325670498084, "grad_norm": 99.17288970947266, "learning_rate": 4.960526315789474e-06, "loss": 1.4807, "step": 115 }, { "epoch": 0.11015325670498084, "loss_full_dim": 0.7763408422470093, "loss_main": 1.5844740867614746, "loss_parscale": 1.609375, "loss_sub_dim": 0.8081332445144653, "loss_vclub": 0.0001735687255859375, "parscale_sim": 0.9921875, "step": 115 }, { "epoch": 0.1111111111111111, "grad_norm": 14.307147026062012, "learning_rate": 4.957894736842106e-06, "loss": 1.5845, "step": 116 }, { "epoch": 0.1111111111111111, "loss_full_dim": 0.7277243137359619, "loss_main": 1.4868676662445068, "loss_parscale": 1.484375, "loss_sub_dim": 0.7591433525085449, "loss_vclub": 0.0001506805419921875, "parscale_sim": 0.9921875, "step": 116 }, { "epoch": 0.11206896551724138, "grad_norm": 9.754802703857422, "learning_rate": 4.955263157894738e-06, "loss": 1.4869, "step": 117 }, { "epoch": 0.11206896551724138, "loss_full_dim": 0.6496493816375732, "loss_main": 1.327056646347046, "loss_parscale": 1.3359375, "loss_sub_dim": 0.6774072051048279, "loss_vclub": 0.00015354156494140625, "parscale_sim": 0.98828125, "step": 117 }, { "epoch": 0.11302681992337164, "grad_norm": 10.07922649383545, "learning_rate": 4.952631578947369e-06, "loss": 1.3271, "step": 118 }, { "epoch": 0.11302681992337164, "loss_full_dim": 0.7423624396324158, "loss_main": 1.515878677368164, "loss_parscale": 1.515625, "loss_sub_dim": 0.7735162377357483, "loss_vclub": 0.0002040863037109375, "parscale_sim": 0.98828125, "step": 118 }, { "epoch": 0.11398467432950192, "grad_norm": 10.377202987670898, "learning_rate": 4.95e-06, "loss": 1.5159, "step": 119 }, { "epoch": 0.11398467432950192, "loss_full_dim": 0.770447850227356, "loss_main": 1.5748106241226196, "loss_parscale": 1.59375, "loss_sub_dim": 0.8043627738952637, "loss_vclub": 0.000171661376953125, "parscale_sim": 0.9921875, "step": 119 }, { "epoch": 0.11494252873563218, "grad_norm": 8.92409896850586, "learning_rate": 4.947368421052632e-06, "loss": 1.5748, "step": 120 }, { "epoch": 0.11494252873563218, "loss_full_dim": 0.7731048464775085, "loss_main": 1.576432704925537, "loss_parscale": 1.578125, "loss_sub_dim": 0.8033279180526733, "loss_vclub": 0.00015735626220703125, "parscale_sim": 0.98828125, "step": 120 }, { "epoch": 0.11590038314176246, "grad_norm": 12.691407203674316, "learning_rate": 4.944736842105264e-06, "loss": 1.5764, "step": 121 }, { "epoch": 0.11590038314176246, "loss_full_dim": 0.7525403499603271, "loss_main": 1.5349661111831665, "loss_parscale": 1.53125, "loss_sub_dim": 0.7824257612228394, "loss_vclub": 0.000171661376953125, "parscale_sim": 0.98828125, "step": 121 }, { "epoch": 0.11685823754789272, "grad_norm": 15.292831420898438, "learning_rate": 4.942105263157895e-06, "loss": 1.535, "step": 122 }, { "epoch": 0.11685823754789272, "loss_full_dim": 0.7322998046875, "loss_main": 1.4972517490386963, "loss_parscale": 1.5, "loss_sub_dim": 0.7649519443511963, "loss_vclub": 0.00016021728515625, "parscale_sim": 0.9921875, "step": 122 }, { "epoch": 0.11781609195402298, "grad_norm": 256.1037902832031, "learning_rate": 4.939473684210526e-06, "loss": 1.4973, "step": 123 }, { "epoch": 0.11781609195402298, "loss_full_dim": 0.6803653836250305, "loss_main": 1.3966116905212402, "loss_parscale": 1.375, "loss_sub_dim": 0.7162463665008545, "loss_vclub": 0.0001220703125, "parscale_sim": 0.9921875, "step": 123 }, { "epoch": 0.11877394636015326, "grad_norm": 13.272331237792969, "learning_rate": 4.936842105263158e-06, "loss": 1.3966, "step": 124 }, { "epoch": 0.11877394636015326, "loss_full_dim": 0.6813011765480042, "loss_main": 1.3938724994659424, "loss_parscale": 1.390625, "loss_sub_dim": 0.7125713229179382, "loss_vclub": 0.00017261505126953125, "parscale_sim": 0.9921875, "step": 124 }, { "epoch": 0.11973180076628352, "grad_norm": 20.107498168945312, "learning_rate": 4.9342105263157895e-06, "loss": 1.3939, "step": 125 }, { "epoch": 0.11973180076628352, "loss_full_dim": 0.6533006429672241, "loss_main": 1.3355116844177246, "loss_parscale": 1.3359375, "loss_sub_dim": 0.6822110414505005, "loss_vclub": 0.0001926422119140625, "parscale_sim": 0.98828125, "step": 125 }, { "epoch": 0.1206896551724138, "grad_norm": 11.895833969116211, "learning_rate": 4.9315789473684215e-06, "loss": 1.3355, "step": 126 }, { "epoch": 0.1206896551724138, "loss_full_dim": 0.64657062292099, "loss_main": 1.3207228183746338, "loss_parscale": 1.3203125, "loss_sub_dim": 0.674152135848999, "loss_vclub": 0.00012493133544921875, "parscale_sim": 0.9921875, "step": 126 }, { "epoch": 0.12164750957854406, "grad_norm": 9.32886028289795, "learning_rate": 4.9289473684210535e-06, "loss": 1.3207, "step": 127 }, { "epoch": 0.12164750957854406, "loss_full_dim": 0.7857539057731628, "loss_main": 1.600822925567627, "loss_parscale": 1.578125, "loss_sub_dim": 0.8150689601898193, "loss_vclub": 0.00025177001953125, "parscale_sim": 0.9921875, "step": 127 }, { "epoch": 0.12260536398467432, "grad_norm": 11.819393157958984, "learning_rate": 4.926315789473685e-06, "loss": 1.6008, "step": 128 }, { "epoch": 0.12260536398467432, "loss_full_dim": 0.6893237829208374, "loss_main": 1.4111006259918213, "loss_parscale": 1.4140625, "loss_sub_dim": 0.7217768430709839, "loss_vclub": 0.0002040863037109375, "parscale_sim": 0.9921875, "step": 128 }, { "epoch": 0.1235632183908046, "grad_norm": 11.956400871276855, "learning_rate": 4.923684210526316e-06, "loss": 1.4111, "step": 129 }, { "epoch": 0.1235632183908046, "loss_full_dim": 0.6201918721199036, "loss_main": 1.270528793334961, "loss_parscale": 1.2890625, "loss_sub_dim": 0.6503369808197021, "loss_vclub": 0.00015926361083984375, "parscale_sim": 0.98828125, "step": 129 }, { "epoch": 0.12452107279693486, "grad_norm": 14.44473648071289, "learning_rate": 4.921052631578948e-06, "loss": 1.2705, "step": 130 }, { "epoch": 0.12452107279693486, "loss_full_dim": 0.7655284404754639, "loss_main": 1.5625271797180176, "loss_parscale": 1.546875, "loss_sub_dim": 0.7969987392425537, "loss_vclub": 0.0001468658447265625, "parscale_sim": 0.96484375, "step": 130 }, { "epoch": 0.12547892720306514, "grad_norm": 10.851838111877441, "learning_rate": 4.91842105263158e-06, "loss": 1.5625, "step": 131 }, { "epoch": 0.12547892720306514, "loss_full_dim": 0.7002301216125488, "loss_main": 1.428841233253479, "loss_parscale": 1.4296875, "loss_sub_dim": 0.7286111116409302, "loss_vclub": 0.0001697540283203125, "parscale_sim": 0.9921875, "step": 131 }, { "epoch": 0.12643678160919541, "grad_norm": 16.441316604614258, "learning_rate": 4.915789473684211e-06, "loss": 1.4288, "step": 132 }, { "epoch": 0.12643678160919541, "loss_full_dim": 0.6820343136787415, "loss_main": 1.3915579319000244, "loss_parscale": 1.3828125, "loss_sub_dim": 0.7095235586166382, "loss_vclub": 0.00020503997802734375, "parscale_sim": 0.9921875, "step": 132 }, { "epoch": 0.12739463601532566, "grad_norm": 13.290495872497559, "learning_rate": 4.913157894736842e-06, "loss": 1.3916, "step": 133 }, { "epoch": 0.12739463601532566, "loss_full_dim": 0.5552437901496887, "loss_main": 1.1424719095230103, "loss_parscale": 1.140625, "loss_sub_dim": 0.5872281193733215, "loss_vclub": 0.0002117156982421875, "parscale_sim": 0.9921875, "step": 133 }, { "epoch": 0.12835249042145594, "grad_norm": 9.854292869567871, "learning_rate": 4.910526315789474e-06, "loss": 1.1425, "step": 134 }, { "epoch": 0.12835249042145594, "loss_full_dim": 0.7192249298095703, "loss_main": 1.4705045223236084, "loss_parscale": 1.4609375, "loss_sub_dim": 0.7512795925140381, "loss_vclub": 0.00017833709716796875, "parscale_sim": 0.9921875, "step": 134 }, { "epoch": 0.12931034482758622, "grad_norm": 18.615766525268555, "learning_rate": 4.907894736842106e-06, "loss": 1.4705, "step": 135 }, { "epoch": 0.12931034482758622, "loss_full_dim": 0.6236118078231812, "loss_main": 1.2770565748214722, "loss_parscale": 1.2734375, "loss_sub_dim": 0.653444766998291, "loss_vclub": 0.00018215179443359375, "parscale_sim": 0.9921875, "step": 135 }, { "epoch": 0.13026819923371646, "grad_norm": 8.442452430725098, "learning_rate": 4.905263157894737e-06, "loss": 1.2771, "step": 136 }, { "epoch": 0.13026819923371646, "loss_full_dim": 0.5406930446624756, "loss_main": 1.1035267114639282, "loss_parscale": 1.109375, "loss_sub_dim": 0.5628336668014526, "loss_vclub": 0.00021648406982421875, "parscale_sim": 0.99609375, "step": 136 }, { "epoch": 0.13122605363984674, "grad_norm": 10.864567756652832, "learning_rate": 4.9026315789473685e-06, "loss": 1.1035, "step": 137 }, { "epoch": 0.13122605363984674, "loss_full_dim": 0.6393163204193115, "loss_main": 1.3059284687042236, "loss_parscale": 1.296875, "loss_sub_dim": 0.6666120886802673, "loss_vclub": 0.00018310546875, "parscale_sim": 0.9921875, "step": 137 }, { "epoch": 0.13218390804597702, "grad_norm": 10.385812759399414, "learning_rate": 4.9000000000000005e-06, "loss": 1.3059, "step": 138 }, { "epoch": 0.13218390804597702, "loss_full_dim": 0.6056349873542786, "loss_main": 1.2363100051879883, "loss_parscale": 1.2421875, "loss_sub_dim": 0.6306750774383545, "loss_vclub": 0.0002288818359375, "parscale_sim": 0.9921875, "step": 138 }, { "epoch": 0.1331417624521073, "grad_norm": 9.326362609863281, "learning_rate": 4.897368421052632e-06, "loss": 1.2363, "step": 139 }, { "epoch": 0.1331417624521073, "loss_full_dim": 0.590990424156189, "loss_main": 1.211578607559204, "loss_parscale": 1.2265625, "loss_sub_dim": 0.6205881834030151, "loss_vclub": 0.0002231597900390625, "parscale_sim": 0.9921875, "step": 139 }, { "epoch": 0.13409961685823754, "grad_norm": 14.025469779968262, "learning_rate": 4.894736842105264e-06, "loss": 1.2116, "step": 140 }, { "epoch": 0.13409961685823754, "loss_full_dim": 0.5866060853004456, "loss_main": 1.1980053186416626, "loss_parscale": 1.1875, "loss_sub_dim": 0.611399233341217, "loss_vclub": 0.00021839141845703125, "parscale_sim": 0.9921875, "step": 140 }, { "epoch": 0.13505747126436782, "grad_norm": 9.101794242858887, "learning_rate": 4.892105263157895e-06, "loss": 1.198, "step": 141 }, { "epoch": 0.13505747126436782, "loss_full_dim": 0.5927587151527405, "loss_main": 1.209796667098999, "loss_parscale": 1.2109375, "loss_sub_dim": 0.6170378923416138, "loss_vclub": 0.0002593994140625, "parscale_sim": 0.9921875, "step": 141 }, { "epoch": 0.1360153256704981, "grad_norm": 9.212407112121582, "learning_rate": 4.889473684210527e-06, "loss": 1.2098, "step": 142 }, { "epoch": 0.1360153256704981, "loss_full_dim": 0.6582940220832825, "loss_main": 1.3508350849151611, "loss_parscale": 1.3515625, "loss_sub_dim": 0.6925411224365234, "loss_vclub": 0.00023365020751953125, "parscale_sim": 0.984375, "step": 142 }, { "epoch": 0.13697318007662834, "grad_norm": 24.496973037719727, "learning_rate": 4.886842105263158e-06, "loss": 1.3508, "step": 143 }, { "epoch": 0.13697318007662834, "loss_full_dim": 0.6102806329727173, "loss_main": 1.247961401939392, "loss_parscale": 1.25, "loss_sub_dim": 0.6376807689666748, "loss_vclub": 0.0001926422119140625, "parscale_sim": 0.98828125, "step": 143 }, { "epoch": 0.13793103448275862, "grad_norm": 9.287469863891602, "learning_rate": 4.88421052631579e-06, "loss": 1.248, "step": 144 }, { "epoch": 0.13793103448275862, "loss_full_dim": 0.6395445466041565, "loss_main": 1.3070592880249023, "loss_parscale": 1.3125, "loss_sub_dim": 0.6675146818161011, "loss_vclub": 0.000202178955078125, "parscale_sim": 0.99609375, "step": 144 }, { "epoch": 0.1388888888888889, "grad_norm": 12.07665729522705, "learning_rate": 4.881578947368422e-06, "loss": 1.3071, "step": 145 }, { "epoch": 0.1388888888888889, "loss_full_dim": 0.46298596262931824, "loss_main": 0.9479407072067261, "loss_parscale": 0.953125, "loss_sub_dim": 0.48495474457740784, "loss_vclub": 0.0002193450927734375, "parscale_sim": 0.9921875, "step": 145 }, { "epoch": 0.13984674329501914, "grad_norm": 10.550821304321289, "learning_rate": 4.878947368421053e-06, "loss": 0.9479, "step": 146 }, { "epoch": 0.13984674329501914, "loss_full_dim": 0.6001034379005432, "loss_main": 1.2241120338439941, "loss_parscale": 1.2265625, "loss_sub_dim": 0.6240086555480957, "loss_vclub": 0.0002651214599609375, "parscale_sim": 0.9921875, "step": 146 }, { "epoch": 0.14080459770114942, "grad_norm": 10.426642417907715, "learning_rate": 4.876315789473684e-06, "loss": 1.2241, "step": 147 }, { "epoch": 0.14080459770114942, "loss_full_dim": 0.6748762130737305, "loss_main": 1.375575065612793, "loss_parscale": 1.375, "loss_sub_dim": 0.7006989121437073, "loss_vclub": 0.00022983551025390625, "parscale_sim": 0.9921875, "step": 147 }, { "epoch": 0.1417624521072797, "grad_norm": 14.163178443908691, "learning_rate": 4.873684210526316e-06, "loss": 1.3756, "step": 148 }, { "epoch": 0.1417624521072797, "loss_full_dim": 0.5950119495391846, "loss_main": 1.2189475297927856, "loss_parscale": 1.203125, "loss_sub_dim": 0.6239355802536011, "loss_vclub": 0.00022602081298828125, "parscale_sim": 0.98828125, "step": 148 }, { "epoch": 0.14272030651340997, "grad_norm": 10.176776885986328, "learning_rate": 4.871052631578948e-06, "loss": 1.2189, "step": 149 }, { "epoch": 0.14272030651340997, "loss_full_dim": 0.5770446062088013, "loss_main": 1.1826252937316895, "loss_parscale": 1.1875, "loss_sub_dim": 0.6055806279182434, "loss_vclub": 0.00022029876708984375, "parscale_sim": 0.9921875, "step": 149 }, { "epoch": 0.14367816091954022, "grad_norm": 12.211570739746094, "learning_rate": 4.8684210526315795e-06, "loss": 1.1826, "step": 150 }, { "epoch": 0.14367816091954022, "loss_full_dim": 0.7355414032936096, "loss_main": 1.4989280700683594, "loss_parscale": 1.4921875, "loss_sub_dim": 0.763386607170105, "loss_vclub": 0.0001926422119140625, "parscale_sim": 0.9921875, "step": 150 }, { "epoch": 0.1446360153256705, "grad_norm": 11.145161628723145, "learning_rate": 4.865789473684211e-06, "loss": 1.4989, "step": 151 }, { "epoch": 0.1446360153256705, "loss_full_dim": 0.5413535237312317, "loss_main": 1.1105239391326904, "loss_parscale": 1.1171875, "loss_sub_dim": 0.569170355796814, "loss_vclub": 0.00023174285888671875, "parscale_sim": 0.9921875, "step": 151 }, { "epoch": 0.14559386973180077, "grad_norm": 8.945379257202148, "learning_rate": 4.863157894736843e-06, "loss": 1.1105, "step": 152 }, { "epoch": 0.14559386973180077, "loss_full_dim": 0.5606626272201538, "loss_main": 1.146736741065979, "loss_parscale": 1.1484375, "loss_sub_dim": 0.5860741138458252, "loss_vclub": 0.00028228759765625, "parscale_sim": 0.9921875, "step": 152 }, { "epoch": 0.14655172413793102, "grad_norm": 13.268875122070312, "learning_rate": 4.860526315789474e-06, "loss": 1.1467, "step": 153 }, { "epoch": 0.14655172413793102, "loss_full_dim": 0.5205703973770142, "loss_main": 1.0646435022354126, "loss_parscale": 1.0625, "loss_sub_dim": 0.5440731048583984, "loss_vclub": 0.000293731689453125, "parscale_sim": 0.9921875, "step": 153 }, { "epoch": 0.1475095785440613, "grad_norm": 9.784695625305176, "learning_rate": 4.857894736842106e-06, "loss": 1.0646, "step": 154 }, { "epoch": 0.1475095785440613, "loss_full_dim": 0.6042582392692566, "loss_main": 1.2339861392974854, "loss_parscale": 1.21875, "loss_sub_dim": 0.6297279596328735, "loss_vclub": 0.00023174285888671875, "parscale_sim": 0.984375, "step": 154 }, { "epoch": 0.14846743295019157, "grad_norm": 11.406333923339844, "learning_rate": 4.855263157894737e-06, "loss": 1.234, "step": 155 }, { "epoch": 0.14846743295019157, "loss_full_dim": 0.6703149080276489, "loss_main": 1.3719580173492432, "loss_parscale": 1.375, "loss_sub_dim": 0.701643168926239, "loss_vclub": 0.000270843505859375, "parscale_sim": 0.9921875, "step": 155 }, { "epoch": 0.14942528735632185, "grad_norm": 6.974386692047119, "learning_rate": 4.852631578947369e-06, "loss": 1.372, "step": 156 }, { "epoch": 0.14942528735632185, "loss_full_dim": 0.5932793021202087, "loss_main": 1.2117798328399658, "loss_parscale": 1.21875, "loss_sub_dim": 0.6185004711151123, "loss_vclub": 0.00026702880859375, "parscale_sim": 0.9921875, "step": 156 }, { "epoch": 0.1503831417624521, "grad_norm": 9.421100616455078, "learning_rate": 4.85e-06, "loss": 1.2118, "step": 157 }, { "epoch": 0.1503831417624521, "loss_full_dim": 0.6871650218963623, "loss_main": 1.4046292304992676, "loss_parscale": 1.40625, "loss_sub_dim": 0.7174642086029053, "loss_vclub": 0.00026702880859375, "parscale_sim": 0.98828125, "step": 157 }, { "epoch": 0.15134099616858238, "grad_norm": 8.739019393920898, "learning_rate": 4.847368421052631e-06, "loss": 1.4046, "step": 158 }, { "epoch": 0.15134099616858238, "loss_full_dim": 0.6217579245567322, "loss_main": 1.2681126594543457, "loss_parscale": 1.2578125, "loss_sub_dim": 0.6463546752929688, "loss_vclub": 0.000270843505859375, "parscale_sim": 0.99609375, "step": 158 }, { "epoch": 0.15229885057471265, "grad_norm": 8.013668060302734, "learning_rate": 4.844736842105263e-06, "loss": 1.2681, "step": 159 }, { "epoch": 0.15229885057471265, "loss_full_dim": 0.5960524082183838, "loss_main": 1.2171776294708252, "loss_parscale": 1.1953125, "loss_sub_dim": 0.6211252212524414, "loss_vclub": 0.00029754638671875, "parscale_sim": 0.9921875, "step": 159 }, { "epoch": 0.1532567049808429, "grad_norm": 9.50171184539795, "learning_rate": 4.842105263157895e-06, "loss": 1.2172, "step": 160 }, { "epoch": 0.1532567049808429, "loss_full_dim": 0.4957144856452942, "loss_main": 1.0150651931762695, "loss_parscale": 1.0078125, "loss_sub_dim": 0.5193507671356201, "loss_vclub": 0.000347137451171875, "parscale_sim": 0.96484375, "step": 160 }, { "epoch": 0.15421455938697318, "grad_norm": 27.193347930908203, "learning_rate": 4.8394736842105265e-06, "loss": 1.0151, "step": 161 }, { "epoch": 0.15421455938697318, "loss_full_dim": 0.6007430553436279, "loss_main": 1.226610541343689, "loss_parscale": 1.2265625, "loss_sub_dim": 0.625867486000061, "loss_vclub": 0.000286102294921875, "parscale_sim": 0.984375, "step": 161 }, { "epoch": 0.15517241379310345, "grad_norm": 9.564090728759766, "learning_rate": 4.8368421052631585e-06, "loss": 1.2266, "step": 162 }, { "epoch": 0.15517241379310345, "loss_full_dim": 0.5936360955238342, "loss_main": 1.2128828763961792, "loss_parscale": 1.21875, "loss_sub_dim": 0.619246780872345, "loss_vclub": 0.0003204345703125, "parscale_sim": 0.9921875, "step": 162 }, { "epoch": 0.15613026819923373, "grad_norm": 9.269503593444824, "learning_rate": 4.8342105263157905e-06, "loss": 1.2129, "step": 163 }, { "epoch": 0.15613026819923373, "loss_full_dim": 0.5406423211097717, "loss_main": 1.1045386791229248, "loss_parscale": 1.109375, "loss_sub_dim": 0.5638963580131531, "loss_vclub": 0.000324249267578125, "parscale_sim": 0.98828125, "step": 163 }, { "epoch": 0.15708812260536398, "grad_norm": 10.17910385131836, "learning_rate": 4.831578947368422e-06, "loss": 1.1045, "step": 164 }, { "epoch": 0.15708812260536398, "loss_full_dim": 0.5160215497016907, "loss_main": 1.0552785396575928, "loss_parscale": 1.0625, "loss_sub_dim": 0.5392570495605469, "loss_vclub": 0.00029754638671875, "parscale_sim": 0.9921875, "step": 164 }, { "epoch": 0.15804597701149425, "grad_norm": 8.10223388671875, "learning_rate": 4.828947368421053e-06, "loss": 1.0553, "step": 165 }, { "epoch": 0.15804597701149425, "loss_full_dim": 0.5982442498207092, "loss_main": 1.2224602699279785, "loss_parscale": 1.21875, "loss_sub_dim": 0.6242159605026245, "loss_vclub": 0.00026702880859375, "parscale_sim": 0.9921875, "step": 165 }, { "epoch": 0.15900383141762453, "grad_norm": 13.964245796203613, "learning_rate": 4.826315789473685e-06, "loss": 1.2225, "step": 166 }, { "epoch": 0.15900383141762453, "loss_full_dim": 0.7109273076057434, "loss_main": 1.4534235000610352, "loss_parscale": 1.453125, "loss_sub_dim": 0.742496132850647, "loss_vclub": 0.0002765655517578125, "parscale_sim": 0.9921875, "step": 166 }, { "epoch": 0.15996168582375478, "grad_norm": 10.008874893188477, "learning_rate": 4.823684210526316e-06, "loss": 1.4534, "step": 167 }, { "epoch": 0.15996168582375478, "loss_full_dim": 0.5840385556221008, "loss_main": 1.1929564476013184, "loss_parscale": 1.1875, "loss_sub_dim": 0.6089178919792175, "loss_vclub": 0.0003032684326171875, "parscale_sim": 0.9921875, "step": 167 }, { "epoch": 0.16091954022988506, "grad_norm": 7.705746173858643, "learning_rate": 4.821052631578948e-06, "loss": 1.193, "step": 168 }, { "epoch": 0.16091954022988506, "loss_full_dim": 0.6494128704071045, "loss_main": 1.3238462209701538, "loss_parscale": 1.3046875, "loss_sub_dim": 0.6744333505630493, "loss_vclub": 0.0002727508544921875, "parscale_sim": 0.9921875, "step": 168 }, { "epoch": 0.16187739463601533, "grad_norm": 11.03174114227295, "learning_rate": 4.818421052631579e-06, "loss": 1.3238, "step": 169 }, { "epoch": 0.16187739463601533, "loss_full_dim": 0.6205196976661682, "loss_main": 1.2658076286315918, "loss_parscale": 1.265625, "loss_sub_dim": 0.6452879905700684, "loss_vclub": 0.000308990478515625, "parscale_sim": 0.9921875, "step": 169 }, { "epoch": 0.16283524904214558, "grad_norm": 14.727489471435547, "learning_rate": 4.815789473684211e-06, "loss": 1.2658, "step": 170 }, { "epoch": 0.16283524904214558, "loss_full_dim": 0.5832352042198181, "loss_main": 1.1941728591918945, "loss_parscale": 1.1953125, "loss_sub_dim": 0.6109375953674316, "loss_vclub": 0.0002956390380859375, "parscale_sim": 0.96484375, "step": 170 }, { "epoch": 0.16379310344827586, "grad_norm": 7.897994518280029, "learning_rate": 4.813157894736842e-06, "loss": 1.1942, "step": 171 }, { "epoch": 0.16379310344827586, "loss_full_dim": 0.56663578748703, "loss_main": 1.1556179523468018, "loss_parscale": 1.15625, "loss_sub_dim": 0.588982105255127, "loss_vclub": 0.000278472900390625, "parscale_sim": 0.9921875, "step": 171 }, { "epoch": 0.16475095785440613, "grad_norm": 9.519448280334473, "learning_rate": 4.8105263157894735e-06, "loss": 1.1556, "step": 172 }, { "epoch": 0.16475095785440613, "loss_full_dim": 0.5771375894546509, "loss_main": 1.182119607925415, "loss_parscale": 1.1953125, "loss_sub_dim": 0.6049820780754089, "loss_vclub": 0.000316619873046875, "parscale_sim": 0.98828125, "step": 172 }, { "epoch": 0.1657088122605364, "grad_norm": 15.688178062438965, "learning_rate": 4.8078947368421055e-06, "loss": 1.1821, "step": 173 }, { "epoch": 0.1657088122605364, "loss_full_dim": 0.5495803356170654, "loss_main": 1.1237319707870483, "loss_parscale": 1.140625, "loss_sub_dim": 0.5741516351699829, "loss_vclub": 0.000293731689453125, "parscale_sim": 0.9921875, "step": 173 }, { "epoch": 0.16666666666666666, "grad_norm": 8.002904891967773, "learning_rate": 4.8052631578947375e-06, "loss": 1.1237, "step": 174 }, { "epoch": 0.16666666666666666, "loss_full_dim": 0.6016480326652527, "loss_main": 1.230215311050415, "loss_parscale": 1.21875, "loss_sub_dim": 0.6285672187805176, "loss_vclub": 0.00034332275390625, "parscale_sim": 0.98828125, "step": 174 }, { "epoch": 0.16762452107279693, "grad_norm": 11.280355453491211, "learning_rate": 4.802631578947369e-06, "loss": 1.2302, "step": 175 }, { "epoch": 0.16762452107279693, "loss_full_dim": 0.6279818415641785, "loss_main": 1.2830159664154053, "loss_parscale": 1.2734375, "loss_sub_dim": 0.6550341248512268, "loss_vclub": 0.0002651214599609375, "parscale_sim": 0.9921875, "step": 175 }, { "epoch": 0.1685823754789272, "grad_norm": 11.521688461303711, "learning_rate": 4.800000000000001e-06, "loss": 1.283, "step": 176 }, { "epoch": 0.1685823754789272, "loss_full_dim": 0.517486035823822, "loss_main": 1.060340404510498, "loss_parscale": 1.0703125, "loss_sub_dim": 0.542854368686676, "loss_vclub": 0.000335693359375, "parscale_sim": 0.9921875, "step": 176 }, { "epoch": 0.16954022988505746, "grad_norm": 10.481809616088867, "learning_rate": 4.797368421052633e-06, "loss": 1.0603, "step": 177 }, { "epoch": 0.16954022988505746, "loss_full_dim": 0.5004745721817017, "loss_main": 1.023289442062378, "loss_parscale": 1.03125, "loss_sub_dim": 0.5228148698806763, "loss_vclub": 0.0003261566162109375, "parscale_sim": 0.98828125, "step": 177 }, { "epoch": 0.17049808429118773, "grad_norm": 15.264375686645508, "learning_rate": 4.794736842105264e-06, "loss": 1.0233, "step": 178 }, { "epoch": 0.17049808429118773, "loss_full_dim": 0.543420135974884, "loss_main": 1.1113494634628296, "loss_parscale": 1.109375, "loss_sub_dim": 0.5679293274879456, "loss_vclub": 0.0002899169921875, "parscale_sim": 0.984375, "step": 178 }, { "epoch": 0.171455938697318, "grad_norm": 20.13178253173828, "learning_rate": 4.792105263157895e-06, "loss": 1.1113, "step": 179 }, { "epoch": 0.171455938697318, "loss_full_dim": 0.6116650104522705, "loss_main": 1.248386263847351, "loss_parscale": 1.25, "loss_sub_dim": 0.6367212533950806, "loss_vclub": 0.00022983551025390625, "parscale_sim": 0.9921875, "step": 179 }, { "epoch": 0.1724137931034483, "grad_norm": 9.096227645874023, "learning_rate": 4.789473684210527e-06, "loss": 1.2484, "step": 180 }, { "epoch": 0.1724137931034483, "loss_full_dim": 0.5068237781524658, "loss_main": 1.0390708446502686, "loss_parscale": 1.046875, "loss_sub_dim": 0.5322471261024475, "loss_vclub": 0.00034332275390625, "parscale_sim": 0.98828125, "step": 180 }, { "epoch": 0.17337164750957854, "grad_norm": 10.203383445739746, "learning_rate": 4.786842105263158e-06, "loss": 1.0391, "step": 181 }, { "epoch": 0.17337164750957854, "loss_full_dim": 0.49830856919288635, "loss_main": 1.0225160121917725, "loss_parscale": 1.0234375, "loss_sub_dim": 0.5242074728012085, "loss_vclub": 0.0003204345703125, "parscale_sim": 0.98828125, "step": 181 }, { "epoch": 0.1743295019157088, "grad_norm": 7.941391468048096, "learning_rate": 4.78421052631579e-06, "loss": 1.0225, "step": 182 }, { "epoch": 0.1743295019157088, "loss_full_dim": 0.584496021270752, "loss_main": 1.1927193403244019, "loss_parscale": 1.1953125, "loss_sub_dim": 0.6082233190536499, "loss_vclub": 0.00032806396484375, "parscale_sim": 0.9921875, "step": 182 }, { "epoch": 0.1752873563218391, "grad_norm": 12.881722450256348, "learning_rate": 4.781578947368421e-06, "loss": 1.1927, "step": 183 }, { "epoch": 0.1752873563218391, "loss_full_dim": 0.5647264719009399, "loss_main": 1.1571580171585083, "loss_parscale": 1.15625, "loss_sub_dim": 0.5924315452575684, "loss_vclub": 0.0003643035888671875, "parscale_sim": 0.9921875, "step": 183 }, { "epoch": 0.17624521072796934, "grad_norm": 9.023982048034668, "learning_rate": 4.778947368421053e-06, "loss": 1.1572, "step": 184 }, { "epoch": 0.17624521072796934, "loss_full_dim": 0.5909804105758667, "loss_main": 1.2077440023422241, "loss_parscale": 1.203125, "loss_sub_dim": 0.6167635917663574, "loss_vclub": 0.00029754638671875, "parscale_sim": 0.9921875, "step": 184 }, { "epoch": 0.1772030651340996, "grad_norm": 76.45648956298828, "learning_rate": 4.7763157894736844e-06, "loss": 1.2077, "step": 185 }, { "epoch": 0.1772030651340996, "loss_full_dim": 0.6564964652061462, "loss_main": 1.336677074432373, "loss_parscale": 1.328125, "loss_sub_dim": 0.6801806688308716, "loss_vclub": 0.0003509521484375, "parscale_sim": 0.9921875, "step": 185 }, { "epoch": 0.1781609195402299, "grad_norm": 11.091370582580566, "learning_rate": 4.773684210526316e-06, "loss": 1.3367, "step": 186 }, { "epoch": 0.1781609195402299, "loss_full_dim": 0.6620768904685974, "loss_main": 1.359856367111206, "loss_parscale": 1.359375, "loss_sub_dim": 0.6977794170379639, "loss_vclub": 0.0003108978271484375, "parscale_sim": 0.9921875, "step": 186 }, { "epoch": 0.17911877394636017, "grad_norm": 15.067858695983887, "learning_rate": 4.771052631578948e-06, "loss": 1.3599, "step": 187 }, { "epoch": 0.17911877394636017, "loss_full_dim": 0.6332782506942749, "loss_main": 1.305781602859497, "loss_parscale": 1.3046875, "loss_sub_dim": 0.6725033521652222, "loss_vclub": 0.000335693359375, "parscale_sim": 0.9921875, "step": 187 }, { "epoch": 0.18007662835249041, "grad_norm": 14.760784149169922, "learning_rate": 4.76842105263158e-06, "loss": 1.3058, "step": 188 }, { "epoch": 0.18007662835249041, "loss_full_dim": 0.5287082195281982, "loss_main": 1.0830856561660767, "loss_parscale": 1.0859375, "loss_sub_dim": 0.5543774366378784, "loss_vclub": 0.000354766845703125, "parscale_sim": 0.9921875, "step": 188 }, { "epoch": 0.1810344827586207, "grad_norm": 10.186994552612305, "learning_rate": 4.765789473684211e-06, "loss": 1.0831, "step": 189 }, { "epoch": 0.1810344827586207, "loss_full_dim": 0.511587917804718, "loss_main": 1.0547235012054443, "loss_parscale": 1.0703125, "loss_sub_dim": 0.5431355237960815, "loss_vclub": 0.00030517578125, "parscale_sim": 0.9921875, "step": 189 }, { "epoch": 0.18199233716475097, "grad_norm": 15.530198097229004, "learning_rate": 4.763157894736842e-06, "loss": 1.0547, "step": 190 }, { "epoch": 0.18199233716475097, "loss_full_dim": 0.6336449384689331, "loss_main": 1.2943851947784424, "loss_parscale": 1.296875, "loss_sub_dim": 0.6607402563095093, "loss_vclub": 0.0003814697265625, "parscale_sim": 0.9921875, "step": 190 }, { "epoch": 0.18295019157088122, "grad_norm": 21.961284637451172, "learning_rate": 4.760526315789474e-06, "loss": 1.2944, "step": 191 }, { "epoch": 0.18295019157088122, "loss_full_dim": 0.5297907590866089, "loss_main": 1.0845223665237427, "loss_parscale": 1.09375, "loss_sub_dim": 0.5547316074371338, "loss_vclub": 0.00037384033203125, "parscale_sim": 0.9921875, "step": 191 }, { "epoch": 0.1839080459770115, "grad_norm": 11.158629417419434, "learning_rate": 4.757894736842106e-06, "loss": 1.0845, "step": 192 }, { "epoch": 0.1839080459770115, "loss_full_dim": 0.4654548168182373, "loss_main": 0.955501914024353, "loss_parscale": 0.953125, "loss_sub_dim": 0.4900470972061157, "loss_vclub": 0.000278472900390625, "parscale_sim": 0.9921875, "step": 192 }, { "epoch": 0.18486590038314177, "grad_norm": 9.870272636413574, "learning_rate": 4.755263157894737e-06, "loss": 0.9555, "step": 193 }, { "epoch": 0.18486590038314177, "loss_full_dim": 0.48131194710731506, "loss_main": 0.9881337881088257, "loss_parscale": 1.0078125, "loss_sub_dim": 0.506821870803833, "loss_vclub": 0.0003643035888671875, "parscale_sim": 0.98828125, "step": 193 }, { "epoch": 0.18582375478927204, "grad_norm": 10.931159019470215, "learning_rate": 4.752631578947369e-06, "loss": 0.9881, "step": 194 }, { "epoch": 0.18582375478927204, "loss_full_dim": 0.588736355304718, "loss_main": 1.2060147523880005, "loss_parscale": 1.203125, "loss_sub_dim": 0.6172783970832825, "loss_vclub": 0.000392913818359375, "parscale_sim": 0.9921875, "step": 194 }, { "epoch": 0.1867816091954023, "grad_norm": 8.466790199279785, "learning_rate": 4.75e-06, "loss": 1.206, "step": 195 }, { "epoch": 0.1867816091954023, "loss_full_dim": 0.515739917755127, "loss_main": 1.0558748245239258, "loss_parscale": 1.046875, "loss_sub_dim": 0.5401349067687988, "loss_vclub": 0.0002727508544921875, "parscale_sim": 0.9921875, "step": 195 }, { "epoch": 0.18773946360153257, "grad_norm": 8.808269500732422, "learning_rate": 4.747368421052632e-06, "loss": 1.0559, "step": 196 }, { "epoch": 0.18773946360153257, "loss_full_dim": 0.5310037732124329, "loss_main": 1.0836825370788574, "loss_parscale": 1.09375, "loss_sub_dim": 0.5526787042617798, "loss_vclub": 0.000392913818359375, "parscale_sim": 0.9921875, "step": 196 }, { "epoch": 0.18869731800766285, "grad_norm": 10.774430274963379, "learning_rate": 4.7447368421052634e-06, "loss": 1.0837, "step": 197 }, { "epoch": 0.18869731800766285, "loss_full_dim": 0.46851444244384766, "loss_main": 0.9592602252960205, "loss_parscale": 0.95703125, "loss_sub_dim": 0.49074578285217285, "loss_vclub": 0.0003681182861328125, "parscale_sim": 0.9921875, "step": 197 }, { "epoch": 0.1896551724137931, "grad_norm": 9.178333282470703, "learning_rate": 4.7421052631578954e-06, "loss": 0.9593, "step": 198 }, { "epoch": 0.1896551724137931, "loss_full_dim": 0.5537492036819458, "loss_main": 1.130022644996643, "loss_parscale": 1.125, "loss_sub_dim": 0.5762734413146973, "loss_vclub": 0.000354766845703125, "parscale_sim": 0.98828125, "step": 198 }, { "epoch": 0.19061302681992337, "grad_norm": 7.5554399490356445, "learning_rate": 4.739473684210527e-06, "loss": 1.13, "step": 199 }, { "epoch": 0.19061302681992337, "loss_full_dim": 0.4872814416885376, "loss_main": 1.0027453899383545, "loss_parscale": 1.015625, "loss_sub_dim": 0.5154639482498169, "loss_vclub": 0.000431060791015625, "parscale_sim": 0.9921875, "step": 199 }, { "epoch": 0.19157088122605365, "grad_norm": 10.593024253845215, "learning_rate": 4.736842105263158e-06, "loss": 1.0027, "step": 200 }, { "epoch": 0.19157088122605365, "loss_full_dim": 0.5341861844062805, "loss_main": 1.092667818069458, "loss_parscale": 1.09375, "loss_sub_dim": 0.5584815740585327, "loss_vclub": 0.000377655029296875, "parscale_sim": 0.9921875, "step": 200 }, { "epoch": 0.1925287356321839, "grad_norm": 9.324244499206543, "learning_rate": 4.73421052631579e-06, "loss": 1.0927, "step": 201 }, { "epoch": 0.1925287356321839, "loss_full_dim": 0.5317597389221191, "loss_main": 1.0875835418701172, "loss_parscale": 1.0703125, "loss_sub_dim": 0.555823802947998, "loss_vclub": 0.00038909912109375, "parscale_sim": 0.98828125, "step": 201 }, { "epoch": 0.19348659003831417, "grad_norm": 9.47535514831543, "learning_rate": 4.731578947368422e-06, "loss": 1.0876, "step": 202 }, { "epoch": 0.19348659003831417, "loss_full_dim": 0.5115731954574585, "loss_main": 1.0457274913787842, "loss_parscale": 1.03125, "loss_sub_dim": 0.5341542959213257, "loss_vclub": 0.000446319580078125, "parscale_sim": 0.9921875, "step": 202 }, { "epoch": 0.19444444444444445, "grad_norm": 8.389193534851074, "learning_rate": 4.728947368421053e-06, "loss": 1.0457, "step": 203 }, { "epoch": 0.19444444444444445, "loss_full_dim": 0.5728447437286377, "loss_main": 1.1707309484481812, "loss_parscale": 1.171875, "loss_sub_dim": 0.5978862047195435, "loss_vclub": 0.0003871917724609375, "parscale_sim": 0.98828125, "step": 203 }, { "epoch": 0.19540229885057472, "grad_norm": 8.570068359375, "learning_rate": 4.726315789473684e-06, "loss": 1.1707, "step": 204 }, { "epoch": 0.19540229885057472, "loss_full_dim": 0.5078824162483215, "loss_main": 1.0383634567260742, "loss_parscale": 1.03125, "loss_sub_dim": 0.5304810404777527, "loss_vclub": 0.000392913818359375, "parscale_sim": 0.9921875, "step": 204 }, { "epoch": 0.19636015325670497, "grad_norm": 7.063410758972168, "learning_rate": 4.723684210526316e-06, "loss": 1.0384, "step": 205 }, { "epoch": 0.19636015325670497, "loss_full_dim": 0.54095458984375, "loss_main": 1.102763056755066, "loss_parscale": 1.109375, "loss_sub_dim": 0.5618084669113159, "loss_vclub": 0.0003490447998046875, "parscale_sim": 0.9921875, "step": 205 }, { "epoch": 0.19731800766283525, "grad_norm": 8.479392051696777, "learning_rate": 4.721052631578948e-06, "loss": 1.1028, "step": 206 }, { "epoch": 0.19731800766283525, "loss_full_dim": 0.4663238227367401, "loss_main": 0.9557645320892334, "loss_parscale": 0.95703125, "loss_sub_dim": 0.4894407391548157, "loss_vclub": 0.00045013427734375, "parscale_sim": 0.98828125, "step": 206 }, { "epoch": 0.19827586206896552, "grad_norm": 11.849605560302734, "learning_rate": 4.718421052631579e-06, "loss": 0.9558, "step": 207 }, { "epoch": 0.19827586206896552, "loss_full_dim": 0.5230794548988342, "loss_main": 1.068739891052246, "loss_parscale": 1.0625, "loss_sub_dim": 0.5456604957580566, "loss_vclub": 0.0004520416259765625, "parscale_sim": 0.9921875, "step": 207 }, { "epoch": 0.19923371647509577, "grad_norm": 8.24896240234375, "learning_rate": 4.71578947368421e-06, "loss": 1.0687, "step": 208 }, { "epoch": 0.19923371647509577, "loss_full_dim": 0.5274395942687988, "loss_main": 1.0800665616989136, "loss_parscale": 1.078125, "loss_sub_dim": 0.5526269674301147, "loss_vclub": 0.0003643035888671875, "parscale_sim": 0.98046875, "step": 208 }, { "epoch": 0.20019157088122605, "grad_norm": 9.249955177307129, "learning_rate": 4.713157894736842e-06, "loss": 1.0801, "step": 209 }, { "epoch": 0.20019157088122605, "loss_full_dim": 0.47910788655281067, "loss_main": 0.9817914962768555, "loss_parscale": 0.984375, "loss_sub_dim": 0.5026836395263672, "loss_vclub": 0.00032806396484375, "parscale_sim": 0.98828125, "step": 209 }, { "epoch": 0.20114942528735633, "grad_norm": 4.638356685638428, "learning_rate": 4.710526315789474e-06, "loss": 0.9818, "step": 210 }, { "epoch": 0.20114942528735633, "loss_full_dim": 0.4992765188217163, "loss_main": 1.0222327709197998, "loss_parscale": 1.0234375, "loss_sub_dim": 0.5229562520980835, "loss_vclub": 0.000415802001953125, "parscale_sim": 0.9921875, "step": 210 }, { "epoch": 0.2021072796934866, "grad_norm": 18.17121124267578, "learning_rate": 4.7078947368421056e-06, "loss": 1.0222, "step": 211 }, { "epoch": 0.2021072796934866, "loss_full_dim": 0.4751662015914917, "loss_main": 0.9704107642173767, "loss_parscale": 0.9765625, "loss_sub_dim": 0.495244562625885, "loss_vclub": 0.000415802001953125, "parscale_sim": 0.98828125, "step": 211 }, { "epoch": 0.20306513409961685, "grad_norm": 8.27853775024414, "learning_rate": 4.705263157894738e-06, "loss": 0.9704, "step": 212 }, { "epoch": 0.20306513409961685, "loss_full_dim": 0.5604925155639648, "loss_main": 1.1453824043273926, "loss_parscale": 1.15625, "loss_sub_dim": 0.5848898887634277, "loss_vclub": 0.000354766845703125, "parscale_sim": 0.98828125, "step": 212 }, { "epoch": 0.20402298850574713, "grad_norm": 9.36913013458252, "learning_rate": 4.702631578947369e-06, "loss": 1.1454, "step": 213 }, { "epoch": 0.20402298850574713, "loss_full_dim": 0.5059170722961426, "loss_main": 1.0323262214660645, "loss_parscale": 1.03125, "loss_sub_dim": 0.5264091491699219, "loss_vclub": 0.00035858154296875, "parscale_sim": 0.984375, "step": 213 }, { "epoch": 0.2049808429118774, "grad_norm": 7.547029972076416, "learning_rate": 4.7e-06, "loss": 1.0323, "step": 214 }, { "epoch": 0.2049808429118774, "loss_full_dim": 0.5274125933647156, "loss_main": 1.079223871231079, "loss_parscale": 1.078125, "loss_sub_dim": 0.5518113374710083, "loss_vclub": 0.0004119873046875, "parscale_sim": 0.9921875, "step": 214 }, { "epoch": 0.20593869731800765, "grad_norm": 10.53579044342041, "learning_rate": 4.697368421052632e-06, "loss": 1.0792, "step": 215 }, { "epoch": 0.20593869731800765, "loss_full_dim": 0.4969152510166168, "loss_main": 1.0158240795135498, "loss_parscale": 1.015625, "loss_sub_dim": 0.5189088582992554, "loss_vclub": 0.0004062652587890625, "parscale_sim": 0.9921875, "step": 215 }, { "epoch": 0.20689655172413793, "grad_norm": 182.4242401123047, "learning_rate": 4.694736842105264e-06, "loss": 1.0158, "step": 216 }, { "epoch": 0.20689655172413793, "loss_full_dim": 0.47677457332611084, "loss_main": 0.9767569303512573, "loss_parscale": 0.9765625, "loss_sub_dim": 0.4999823272228241, "loss_vclub": 0.000484466552734375, "parscale_sim": 0.9921875, "step": 216 }, { "epoch": 0.2078544061302682, "grad_norm": 405.1500244140625, "learning_rate": 4.692105263157895e-06, "loss": 0.9768, "step": 217 }, { "epoch": 0.2078544061302682, "loss_full_dim": 0.501966655254364, "loss_main": 1.0282154083251953, "loss_parscale": 1.03125, "loss_sub_dim": 0.5262486934661865, "loss_vclub": 0.000362396240234375, "parscale_sim": 0.9921875, "step": 217 }, { "epoch": 0.20881226053639848, "grad_norm": 10.953872680664062, "learning_rate": 4.689473684210526e-06, "loss": 1.0282, "step": 218 }, { "epoch": 0.20881226053639848, "loss_full_dim": 0.5510133504867554, "loss_main": 1.1260230541229248, "loss_parscale": 1.140625, "loss_sub_dim": 0.5750097036361694, "loss_vclub": 0.000385284423828125, "parscale_sim": 0.9921875, "step": 218 }, { "epoch": 0.20977011494252873, "grad_norm": 10.328356742858887, "learning_rate": 4.686842105263158e-06, "loss": 1.126, "step": 219 }, { "epoch": 0.20977011494252873, "loss_full_dim": 0.5719544291496277, "loss_main": 1.1672308444976807, "loss_parscale": 1.171875, "loss_sub_dim": 0.595276415348053, "loss_vclub": 0.00038909912109375, "parscale_sim": 0.9921875, "step": 219 }, { "epoch": 0.210727969348659, "grad_norm": 9.254385948181152, "learning_rate": 4.68421052631579e-06, "loss": 1.1672, "step": 220 }, { "epoch": 0.210727969348659, "loss_full_dim": 0.49342820048332214, "loss_main": 1.0120505094528198, "loss_parscale": 1.015625, "loss_sub_dim": 0.5186222791671753, "loss_vclub": 0.0004596710205078125, "parscale_sim": 0.9921875, "step": 220 }, { "epoch": 0.21168582375478928, "grad_norm": 8.71795654296875, "learning_rate": 4.681578947368421e-06, "loss": 1.0121, "step": 221 }, { "epoch": 0.21168582375478928, "loss_full_dim": 0.4915499985218048, "loss_main": 1.0095373392105103, "loss_parscale": 1.0078125, "loss_sub_dim": 0.5179873704910278, "loss_vclub": 0.000484466552734375, "parscale_sim": 0.9921875, "step": 221 }, { "epoch": 0.21264367816091953, "grad_norm": 9.600993156433105, "learning_rate": 4.6789473684210525e-06, "loss": 1.0095, "step": 222 }, { "epoch": 0.21264367816091953, "loss_full_dim": 0.5491585731506348, "loss_main": 1.1240359544754028, "loss_parscale": 1.125, "loss_sub_dim": 0.5748773813247681, "loss_vclub": 0.000438690185546875, "parscale_sim": 0.9921875, "step": 222 }, { "epoch": 0.2136015325670498, "grad_norm": 14.276325225830078, "learning_rate": 4.6763157894736846e-06, "loss": 1.124, "step": 223 }, { "epoch": 0.2136015325670498, "loss_full_dim": 0.4523112177848816, "loss_main": 0.9291536808013916, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4768424332141876, "loss_vclub": 0.0003719329833984375, "parscale_sim": 0.984375, "step": 223 }, { "epoch": 0.21455938697318008, "grad_norm": 8.111910820007324, "learning_rate": 4.6736842105263166e-06, "loss": 0.9292, "step": 224 }, { "epoch": 0.21455938697318008, "loss_full_dim": 0.587410032749176, "loss_main": 1.197158694267273, "loss_parscale": 1.1953125, "loss_sub_dim": 0.6097486615180969, "loss_vclub": 0.0003643035888671875, "parscale_sim": 0.984375, "step": 224 }, { "epoch": 0.21551724137931033, "grad_norm": 10.57785415649414, "learning_rate": 4.671052631578948e-06, "loss": 1.1972, "step": 225 }, { "epoch": 0.21551724137931033, "loss_full_dim": 0.5275124907493591, "loss_main": 1.079030990600586, "loss_parscale": 1.0859375, "loss_sub_dim": 0.551518440246582, "loss_vclub": 0.0004119873046875, "parscale_sim": 0.9921875, "step": 225 }, { "epoch": 0.2164750957854406, "grad_norm": 8.719523429870605, "learning_rate": 4.668421052631579e-06, "loss": 1.079, "step": 226 }, { "epoch": 0.2164750957854406, "loss_full_dim": 0.45050573348999023, "loss_main": 0.9221673011779785, "loss_parscale": 0.921875, "loss_sub_dim": 0.4716615378856659, "loss_vclub": 0.000408172607421875, "parscale_sim": 0.9921875, "step": 226 }, { "epoch": 0.21743295019157088, "grad_norm": 19.269493103027344, "learning_rate": 4.665789473684211e-06, "loss": 0.9222, "step": 227 }, { "epoch": 0.21743295019157088, "loss_full_dim": 0.4216449558734894, "loss_main": 0.8623942732810974, "loss_parscale": 0.8828125, "loss_sub_dim": 0.44074931740760803, "loss_vclub": 0.000469207763671875, "parscale_sim": 0.9921875, "step": 227 }, { "epoch": 0.21839080459770116, "grad_norm": 7.17505407333374, "learning_rate": 4.663157894736842e-06, "loss": 0.8624, "step": 228 }, { "epoch": 0.21839080459770116, "loss_full_dim": 0.5197829008102417, "loss_main": 1.0613197088241577, "loss_parscale": 1.0703125, "loss_sub_dim": 0.541536808013916, "loss_vclub": 0.000396728515625, "parscale_sim": 0.9921875, "step": 228 }, { "epoch": 0.2193486590038314, "grad_norm": 10.184402465820312, "learning_rate": 4.660526315789474e-06, "loss": 1.0613, "step": 229 }, { "epoch": 0.2193486590038314, "loss_full_dim": 0.5260148048400879, "loss_main": 1.073478102684021, "loss_parscale": 1.0859375, "loss_sub_dim": 0.5474632978439331, "loss_vclub": 0.000362396240234375, "parscale_sim": 0.9921875, "step": 229 }, { "epoch": 0.22030651340996169, "grad_norm": 8.238923072814941, "learning_rate": 4.657894736842106e-06, "loss": 1.0735, "step": 230 }, { "epoch": 0.22030651340996169, "loss_full_dim": 0.4951419234275818, "loss_main": 1.0120069980621338, "loss_parscale": 1.015625, "loss_sub_dim": 0.5168650150299072, "loss_vclub": 0.0004119873046875, "parscale_sim": 0.9921875, "step": 230 }, { "epoch": 0.22126436781609196, "grad_norm": 8.553231239318848, "learning_rate": 4.655263157894737e-06, "loss": 1.012, "step": 231 }, { "epoch": 0.22126436781609196, "loss_full_dim": 0.4860287308692932, "loss_main": 0.9950713515281677, "loss_parscale": 1.0, "loss_sub_dim": 0.5090426206588745, "loss_vclub": 0.000392913818359375, "parscale_sim": 0.9921875, "step": 231 }, { "epoch": 0.2222222222222222, "grad_norm": 8.46462345123291, "learning_rate": 4.652631578947368e-06, "loss": 0.9951, "step": 232 }, { "epoch": 0.2222222222222222, "loss_full_dim": 0.550058901309967, "loss_main": 1.122519850730896, "loss_parscale": 1.125, "loss_sub_dim": 0.572460949420929, "loss_vclub": 0.000362396240234375, "parscale_sim": 0.9921875, "step": 232 }, { "epoch": 0.2231800766283525, "grad_norm": 11.993524551391602, "learning_rate": 4.65e-06, "loss": 1.1225, "step": 233 }, { "epoch": 0.2231800766283525, "loss_full_dim": 0.4654732644557953, "loss_main": 0.9502544403076172, "loss_parscale": 0.95703125, "loss_sub_dim": 0.4847811460494995, "loss_vclub": 0.00048828125, "parscale_sim": 0.9921875, "step": 233 }, { "epoch": 0.22413793103448276, "grad_norm": 8.511637687683105, "learning_rate": 4.647368421052632e-06, "loss": 0.9503, "step": 234 }, { "epoch": 0.22413793103448276, "loss_full_dim": 0.4176832139492035, "loss_main": 0.8529937267303467, "loss_parscale": 0.8515625, "loss_sub_dim": 0.4353105425834656, "loss_vclub": 0.000446319580078125, "parscale_sim": 0.98828125, "step": 234 }, { "epoch": 0.22509578544061304, "grad_norm": 7.605699062347412, "learning_rate": 4.6447368421052635e-06, "loss": 0.853, "step": 235 }, { "epoch": 0.22509578544061304, "loss_full_dim": 0.4602102041244507, "loss_main": 0.9416458606719971, "loss_parscale": 0.953125, "loss_sub_dim": 0.4814356565475464, "loss_vclub": 0.000423431396484375, "parscale_sim": 0.9921875, "step": 235 }, { "epoch": 0.2260536398467433, "grad_norm": 7.737176895141602, "learning_rate": 4.642105263157895e-06, "loss": 0.9416, "step": 236 }, { "epoch": 0.2260536398467433, "loss_full_dim": 0.49290135502815247, "loss_main": 1.0065968036651611, "loss_parscale": 1.0, "loss_sub_dim": 0.513695478439331, "loss_vclub": 0.000392913818359375, "parscale_sim": 0.98828125, "step": 236 }, { "epoch": 0.22701149425287356, "grad_norm": 10.699085235595703, "learning_rate": 4.639473684210527e-06, "loss": 1.0066, "step": 237 }, { "epoch": 0.22701149425287356, "loss_full_dim": 0.5663456916809082, "loss_main": 1.1530635356903076, "loss_parscale": 1.15625, "loss_sub_dim": 0.5867177844047546, "loss_vclub": 0.000431060791015625, "parscale_sim": 0.99609375, "step": 237 }, { "epoch": 0.22796934865900384, "grad_norm": 9.548462867736816, "learning_rate": 4.636842105263159e-06, "loss": 1.1531, "step": 238 }, { "epoch": 0.22796934865900384, "loss_full_dim": 0.42086338996887207, "loss_main": 0.8591489791870117, "loss_parscale": 0.8515625, "loss_sub_dim": 0.43828558921813965, "loss_vclub": 0.000423431396484375, "parscale_sim": 0.98828125, "step": 238 }, { "epoch": 0.2289272030651341, "grad_norm": 8.991925239562988, "learning_rate": 4.63421052631579e-06, "loss": 0.8591, "step": 239 }, { "epoch": 0.2289272030651341, "loss_full_dim": 0.3970876634120941, "loss_main": 0.8119007349014282, "loss_parscale": 0.81640625, "loss_sub_dim": 0.4148131012916565, "loss_vclub": 0.00045013427734375, "parscale_sim": 0.9921875, "step": 239 }, { "epoch": 0.22988505747126436, "grad_norm": 6.494623184204102, "learning_rate": 4.631578947368421e-06, "loss": 0.8119, "step": 240 }, { "epoch": 0.22988505747126436, "loss_full_dim": 0.47419995069503784, "loss_main": 0.9698991179466248, "loss_parscale": 0.96875, "loss_sub_dim": 0.4956991672515869, "loss_vclub": 0.000392913818359375, "parscale_sim": 0.9921875, "step": 240 }, { "epoch": 0.23084291187739464, "grad_norm": 8.835042953491211, "learning_rate": 4.628947368421053e-06, "loss": 0.9699, "step": 241 }, { "epoch": 0.23084291187739464, "loss_full_dim": 0.5273511409759521, "loss_main": 1.0759369134902954, "loss_parscale": 1.0859375, "loss_sub_dim": 0.5485857725143433, "loss_vclub": 0.0004730224609375, "parscale_sim": 0.984375, "step": 241 }, { "epoch": 0.23180076628352492, "grad_norm": 10.336626052856445, "learning_rate": 4.626315789473684e-06, "loss": 1.0759, "step": 242 }, { "epoch": 0.23180076628352492, "loss_full_dim": 0.4913197159767151, "loss_main": 1.0007898807525635, "loss_parscale": 1.0078125, "loss_sub_dim": 0.5094701051712036, "loss_vclub": 0.00057220458984375, "parscale_sim": 0.9921875, "step": 242 }, { "epoch": 0.23275862068965517, "grad_norm": 9.211519241333008, "learning_rate": 4.623684210526316e-06, "loss": 1.0008, "step": 243 }, { "epoch": 0.23275862068965517, "loss_full_dim": 0.4852541387081146, "loss_main": 0.9942642450332642, "loss_parscale": 0.98828125, "loss_sub_dim": 0.5090101361274719, "loss_vclub": 0.00049591064453125, "parscale_sim": 0.9921875, "step": 243 }, { "epoch": 0.23371647509578544, "grad_norm": 8.892725944519043, "learning_rate": 4.621052631578948e-06, "loss": 0.9943, "step": 244 }, { "epoch": 0.23371647509578544, "loss_full_dim": 0.49711281061172485, "loss_main": 1.0158917903900146, "loss_parscale": 1.0078125, "loss_sub_dim": 0.518778920173645, "loss_vclub": 0.000400543212890625, "parscale_sim": 0.9921875, "step": 244 }, { "epoch": 0.23467432950191572, "grad_norm": 7.340822696685791, "learning_rate": 4.618421052631579e-06, "loss": 1.0159, "step": 245 }, { "epoch": 0.23467432950191572, "loss_full_dim": 0.4268127977848053, "loss_main": 0.8746825456619263, "loss_parscale": 0.890625, "loss_sub_dim": 0.44786977767944336, "loss_vclub": 0.00042724609375, "parscale_sim": 0.9921875, "step": 245 }, { "epoch": 0.23563218390804597, "grad_norm": 8.862424850463867, "learning_rate": 4.6157894736842105e-06, "loss": 0.8747, "step": 246 }, { "epoch": 0.23563218390804597, "loss_full_dim": 0.5573349595069885, "loss_main": 1.1387555599212646, "loss_parscale": 1.140625, "loss_sub_dim": 0.5814206600189209, "loss_vclub": 0.0005340576171875, "parscale_sim": 0.9921875, "step": 246 }, { "epoch": 0.23659003831417624, "grad_norm": 9.663114547729492, "learning_rate": 4.6131578947368425e-06, "loss": 1.1388, "step": 247 }, { "epoch": 0.23659003831417624, "loss_full_dim": 0.528306245803833, "loss_main": 1.0797092914581299, "loss_parscale": 1.078125, "loss_sub_dim": 0.5514030456542969, "loss_vclub": 0.0003833770751953125, "parscale_sim": 0.98828125, "step": 247 }, { "epoch": 0.23754789272030652, "grad_norm": 8.98139762878418, "learning_rate": 4.6105263157894745e-06, "loss": 1.0797, "step": 248 }, { "epoch": 0.23754789272030652, "loss_full_dim": 0.4825408458709717, "loss_main": 0.9849791526794434, "loss_parscale": 0.984375, "loss_sub_dim": 0.5024383068084717, "loss_vclub": 0.00048828125, "parscale_sim": 0.9921875, "step": 248 }, { "epoch": 0.23850574712643677, "grad_norm": 59.11452865600586, "learning_rate": 4.607894736842106e-06, "loss": 0.985, "step": 249 }, { "epoch": 0.23850574712643677, "loss_full_dim": 0.4470995366573334, "loss_main": 0.9128706455230713, "loss_parscale": 0.9140625, "loss_sub_dim": 0.4657710790634155, "loss_vclub": 0.000514984130859375, "parscale_sim": 0.98828125, "step": 249 }, { "epoch": 0.23946360153256704, "grad_norm": 8.089098930358887, "learning_rate": 4.605263157894737e-06, "loss": 0.9129, "step": 250 }, { "epoch": 0.23946360153256704, "loss_full_dim": 0.4852767884731293, "loss_main": 0.9941668510437012, "loss_parscale": 1.0, "loss_sub_dim": 0.5088900327682495, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.984375, "step": 250 }, { "epoch": 0.24042145593869732, "grad_norm": 11.203875541687012, "learning_rate": 4.602631578947369e-06, "loss": 0.9942, "step": 251 }, { "epoch": 0.24042145593869732, "loss_full_dim": 0.44073402881622314, "loss_main": 0.9015941023826599, "loss_parscale": 0.8984375, "loss_sub_dim": 0.46086007356643677, "loss_vclub": 0.000457763671875, "parscale_sim": 0.9921875, "step": 251 }, { "epoch": 0.2413793103448276, "grad_norm": 9.61412525177002, "learning_rate": 4.600000000000001e-06, "loss": 0.9016, "step": 252 }, { "epoch": 0.2413793103448276, "loss_full_dim": 0.48969578742980957, "loss_main": 1.0014615058898926, "loss_parscale": 1.015625, "loss_sub_dim": 0.5117656588554382, "loss_vclub": 0.00049591064453125, "parscale_sim": 0.9921875, "step": 252 }, { "epoch": 0.24233716475095785, "grad_norm": 10.904346466064453, "learning_rate": 4.597368421052632e-06, "loss": 1.0015, "step": 253 }, { "epoch": 0.24233716475095785, "loss_full_dim": 0.454096257686615, "loss_main": 0.9294857978820801, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4753895401954651, "loss_vclub": 0.00049591064453125, "parscale_sim": 0.98828125, "step": 253 }, { "epoch": 0.24329501915708812, "grad_norm": 10.038652420043945, "learning_rate": 4.594736842105263e-06, "loss": 0.9295, "step": 254 }, { "epoch": 0.24329501915708812, "loss_full_dim": 0.5073431730270386, "loss_main": 1.038255214691162, "loss_parscale": 1.046875, "loss_sub_dim": 0.5309119820594788, "loss_vclub": 0.00054168701171875, "parscale_sim": 0.98828125, "step": 254 }, { "epoch": 0.2442528735632184, "grad_norm": 7.688155174255371, "learning_rate": 4.592105263157895e-06, "loss": 1.0383, "step": 255 }, { "epoch": 0.2442528735632184, "loss_full_dim": 0.4828082323074341, "loss_main": 0.9883140921592712, "loss_parscale": 0.9921875, "loss_sub_dim": 0.5055058598518372, "loss_vclub": 0.000579833984375, "parscale_sim": 0.9921875, "step": 255 }, { "epoch": 0.24521072796934865, "grad_norm": 9.121203422546387, "learning_rate": 4.589473684210526e-06, "loss": 0.9883, "step": 256 }, { "epoch": 0.24521072796934865, "loss_full_dim": 0.489645779132843, "loss_main": 1.0017318725585938, "loss_parscale": 1.0, "loss_sub_dim": 0.512086033821106, "loss_vclub": 0.000492095947265625, "parscale_sim": 0.984375, "step": 256 }, { "epoch": 0.24616858237547892, "grad_norm": 8.611320495605469, "learning_rate": 4.586842105263158e-06, "loss": 1.0017, "step": 257 }, { "epoch": 0.24616858237547892, "loss_full_dim": 0.4855557084083557, "loss_main": 0.9925225377082825, "loss_parscale": 0.9921875, "loss_sub_dim": 0.5069668292999268, "loss_vclub": 0.000484466552734375, "parscale_sim": 0.9921875, "step": 257 }, { "epoch": 0.2471264367816092, "grad_norm": 9.76815128326416, "learning_rate": 4.5842105263157895e-06, "loss": 0.9925, "step": 258 }, { "epoch": 0.2471264367816092, "loss_full_dim": 0.4172544479370117, "loss_main": 0.8546002507209778, "loss_parscale": 0.859375, "loss_sub_dim": 0.43734580278396606, "loss_vclub": 0.00054168701171875, "parscale_sim": 0.9921875, "step": 258 }, { "epoch": 0.24808429118773948, "grad_norm": 8.38315200805664, "learning_rate": 4.5815789473684215e-06, "loss": 0.8546, "step": 259 }, { "epoch": 0.24808429118773948, "loss_full_dim": 0.413883775472641, "loss_main": 0.8475886583328247, "loss_parscale": 0.859375, "loss_sub_dim": 0.43370485305786133, "loss_vclub": 0.0004596710205078125, "parscale_sim": 0.98828125, "step": 259 }, { "epoch": 0.24904214559386972, "grad_norm": 6.42150354385376, "learning_rate": 4.578947368421053e-06, "loss": 0.8476, "step": 260 }, { "epoch": 0.24904214559386972, "loss_full_dim": 0.5152835845947266, "loss_main": 1.0520315170288086, "loss_parscale": 1.046875, "loss_sub_dim": 0.536747932434082, "loss_vclub": 0.0004520416259765625, "parscale_sim": 0.9921875, "step": 260 }, { "epoch": 0.25, "grad_norm": 7.348369121551514, "learning_rate": 4.576315789473685e-06, "loss": 1.052, "step": 261 }, { "epoch": 0.25, "loss_full_dim": 0.43916410207748413, "loss_main": 0.8979260325431824, "loss_parscale": 0.90234375, "loss_sub_dim": 0.45876193046569824, "loss_vclub": 0.000484466552734375, "parscale_sim": 0.98828125, "step": 261 }, { "epoch": 0.2509578544061303, "grad_norm": 8.055561065673828, "learning_rate": 4.573684210526317e-06, "loss": 0.8979, "step": 262 }, { "epoch": 0.2509578544061303, "loss_full_dim": 0.47594013810157776, "loss_main": 0.9698396921157837, "loss_parscale": 0.984375, "loss_sub_dim": 0.4938995838165283, "loss_vclub": 0.0005340576171875, "parscale_sim": 0.9921875, "step": 262 }, { "epoch": 0.25191570881226055, "grad_norm": 7.039929389953613, "learning_rate": 4.571052631578948e-06, "loss": 0.9698, "step": 263 }, { "epoch": 0.25191570881226055, "loss_full_dim": 0.5181564688682556, "loss_main": 1.0569794178009033, "loss_parscale": 1.0625, "loss_sub_dim": 0.5388228893280029, "loss_vclub": 0.000476837158203125, "parscale_sim": 0.9921875, "step": 263 }, { "epoch": 0.25287356321839083, "grad_norm": 9.308348655700684, "learning_rate": 4.568421052631579e-06, "loss": 1.057, "step": 264 }, { "epoch": 0.25287356321839083, "loss_full_dim": 0.5191400647163391, "loss_main": 1.0600566864013672, "loss_parscale": 1.0625, "loss_sub_dim": 0.5409166812896729, "loss_vclub": 0.000659942626953125, "parscale_sim": 0.9921875, "step": 264 }, { "epoch": 0.25383141762452105, "grad_norm": 5.814869403839111, "learning_rate": 4.565789473684211e-06, "loss": 1.0601, "step": 265 }, { "epoch": 0.25383141762452105, "loss_full_dim": 0.45739492774009705, "loss_main": 0.9344923496246338, "loss_parscale": 0.9453125, "loss_sub_dim": 0.47709739208221436, "loss_vclub": 0.000446319580078125, "parscale_sim": 0.9921875, "step": 265 }, { "epoch": 0.2547892720306513, "grad_norm": 17.09619140625, "learning_rate": 4.563157894736843e-06, "loss": 0.9345, "step": 266 }, { "epoch": 0.2547892720306513, "loss_full_dim": 0.48758506774902344, "loss_main": 0.9943277835845947, "loss_parscale": 1.0078125, "loss_sub_dim": 0.5067427158355713, "loss_vclub": 0.00051116943359375, "parscale_sim": 0.9921875, "step": 266 }, { "epoch": 0.2557471264367816, "grad_norm": 7.746295928955078, "learning_rate": 4.560526315789474e-06, "loss": 0.9943, "step": 267 }, { "epoch": 0.2557471264367816, "loss_full_dim": 0.4630741477012634, "loss_main": 0.9484955072402954, "loss_parscale": 0.94140625, "loss_sub_dim": 0.485421359539032, "loss_vclub": 0.00054931640625, "parscale_sim": 0.9921875, "step": 267 }, { "epoch": 0.2567049808429119, "grad_norm": 9.203831672668457, "learning_rate": 4.557894736842105e-06, "loss": 0.9485, "step": 268 }, { "epoch": 0.2567049808429119, "loss_full_dim": 0.47618359327316284, "loss_main": 0.9711581468582153, "loss_parscale": 0.96875, "loss_sub_dim": 0.4949745833873749, "loss_vclub": 0.00046539306640625, "parscale_sim": 0.984375, "step": 268 }, { "epoch": 0.25766283524904215, "grad_norm": 7.7073140144348145, "learning_rate": 4.555263157894737e-06, "loss": 0.9712, "step": 269 }, { "epoch": 0.25766283524904215, "loss_full_dim": 0.4941484332084656, "loss_main": 1.0097227096557617, "loss_parscale": 1.03125, "loss_sub_dim": 0.5155743360519409, "loss_vclub": 0.00041961669921875, "parscale_sim": 0.9921875, "step": 269 }, { "epoch": 0.25862068965517243, "grad_norm": 8.010236740112305, "learning_rate": 4.552631578947369e-06, "loss": 1.0097, "step": 270 }, { "epoch": 0.25862068965517243, "loss_full_dim": 0.488547682762146, "loss_main": 0.9992552995681763, "loss_parscale": 0.9921875, "loss_sub_dim": 0.5107076168060303, "loss_vclub": 0.00048065185546875, "parscale_sim": 0.9921875, "step": 270 }, { "epoch": 0.2595785440613027, "grad_norm": 11.0455904006958, "learning_rate": 4.5500000000000005e-06, "loss": 0.9993, "step": 271 }, { "epoch": 0.2595785440613027, "loss_full_dim": 0.41027581691741943, "loss_main": 0.8413853049278259, "loss_parscale": 0.84375, "loss_sub_dim": 0.4311094880104065, "loss_vclub": 0.000484466552734375, "parscale_sim": 0.9921875, "step": 271 }, { "epoch": 0.26053639846743293, "grad_norm": 8.0972318649292, "learning_rate": 4.547368421052632e-06, "loss": 0.8414, "step": 272 }, { "epoch": 0.26053639846743293, "loss_full_dim": 0.4256237745285034, "loss_main": 0.8713397979736328, "loss_parscale": 0.8671875, "loss_sub_dim": 0.4457160234451294, "loss_vclub": 0.00042724609375, "parscale_sim": 0.9921875, "step": 272 }, { "epoch": 0.2614942528735632, "grad_norm": 6.348586559295654, "learning_rate": 4.544736842105264e-06, "loss": 0.8713, "step": 273 }, { "epoch": 0.2614942528735632, "loss_full_dim": 0.46642228960990906, "loss_main": 0.9515293836593628, "loss_parscale": 0.94140625, "loss_sub_dim": 0.48510709404945374, "loss_vclub": 0.0004177093505859375, "parscale_sim": 0.98828125, "step": 273 }, { "epoch": 0.2624521072796935, "grad_norm": 8.78376579284668, "learning_rate": 4.542105263157895e-06, "loss": 0.9515, "step": 274 }, { "epoch": 0.2624521072796935, "loss_full_dim": 0.5247511863708496, "loss_main": 1.0738792419433594, "loss_parscale": 1.078125, "loss_sub_dim": 0.5491281151771545, "loss_vclub": 0.0004730224609375, "parscale_sim": 0.9921875, "step": 274 }, { "epoch": 0.26340996168582376, "grad_norm": 7.737121105194092, "learning_rate": 4.539473684210527e-06, "loss": 1.0739, "step": 275 }, { "epoch": 0.26340996168582376, "loss_full_dim": 0.49684369564056396, "loss_main": 1.014967441558838, "loss_parscale": 1.0078125, "loss_sub_dim": 0.5181237459182739, "loss_vclub": 0.000545501708984375, "parscale_sim": 0.9921875, "step": 275 }, { "epoch": 0.26436781609195403, "grad_norm": 8.31530475616455, "learning_rate": 4.536842105263158e-06, "loss": 1.015, "step": 276 }, { "epoch": 0.26436781609195403, "loss_full_dim": 0.49680209159851074, "loss_main": 1.013606071472168, "loss_parscale": 1.0078125, "loss_sub_dim": 0.5168039798736572, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.984375, "step": 276 }, { "epoch": 0.2653256704980843, "grad_norm": 10.129792213439941, "learning_rate": 4.53421052631579e-06, "loss": 1.0136, "step": 277 }, { "epoch": 0.2653256704980843, "loss_full_dim": 0.44285112619400024, "loss_main": 0.9033362865447998, "loss_parscale": 0.91015625, "loss_sub_dim": 0.46048516035079956, "loss_vclub": 0.000598907470703125, "parscale_sim": 0.9921875, "step": 277 }, { "epoch": 0.2662835249042146, "grad_norm": 8.688750267028809, "learning_rate": 4.531578947368421e-06, "loss": 0.9033, "step": 278 }, { "epoch": 0.2662835249042146, "loss_full_dim": 0.43428507447242737, "loss_main": 0.8864010572433472, "loss_parscale": 0.88671875, "loss_sub_dim": 0.4521159529685974, "loss_vclub": 0.000431060791015625, "parscale_sim": 0.9921875, "step": 278 }, { "epoch": 0.2672413793103448, "grad_norm": 8.43358039855957, "learning_rate": 4.528947368421053e-06, "loss": 0.8864, "step": 279 }, { "epoch": 0.2672413793103448, "loss_full_dim": 0.4282614588737488, "loss_main": 0.8756113648414612, "loss_parscale": 0.875, "loss_sub_dim": 0.4473499059677124, "loss_vclub": 0.00048828125, "parscale_sim": 0.9921875, "step": 279 }, { "epoch": 0.2681992337164751, "grad_norm": 7.135706424713135, "learning_rate": 4.526315789473685e-06, "loss": 0.8756, "step": 280 }, { "epoch": 0.2681992337164751, "loss_full_dim": 0.4786289930343628, "loss_main": 0.9790223240852356, "loss_parscale": 0.98828125, "loss_sub_dim": 0.5003933310508728, "loss_vclub": 0.000438690185546875, "parscale_sim": 0.98828125, "step": 280 }, { "epoch": 0.26915708812260536, "grad_norm": 9.867084503173828, "learning_rate": 4.523684210526316e-06, "loss": 0.979, "step": 281 }, { "epoch": 0.26915708812260536, "loss_full_dim": 0.4841550886631012, "loss_main": 0.9887421131134033, "loss_parscale": 0.984375, "loss_sub_dim": 0.5045870542526245, "loss_vclub": 0.000492095947265625, "parscale_sim": 0.9921875, "step": 281 }, { "epoch": 0.27011494252873564, "grad_norm": 9.92682933807373, "learning_rate": 4.5210526315789475e-06, "loss": 0.9887, "step": 282 }, { "epoch": 0.27011494252873564, "loss_full_dim": 0.4865942895412445, "loss_main": 0.9977622032165527, "loss_parscale": 1.015625, "loss_sub_dim": 0.5111679434776306, "loss_vclub": 0.0004711151123046875, "parscale_sim": 0.9921875, "step": 282 }, { "epoch": 0.2710727969348659, "grad_norm": 10.110612869262695, "learning_rate": 4.5184210526315795e-06, "loss": 0.9978, "step": 283 }, { "epoch": 0.2710727969348659, "loss_full_dim": 0.5175797343254089, "loss_main": 1.0597131252288818, "loss_parscale": 1.078125, "loss_sub_dim": 0.5421334505081177, "loss_vclub": 0.0004291534423828125, "parscale_sim": 0.9921875, "step": 283 }, { "epoch": 0.2720306513409962, "grad_norm": 10.729455947875977, "learning_rate": 4.5157894736842115e-06, "loss": 1.0597, "step": 284 }, { "epoch": 0.2720306513409962, "loss_full_dim": 0.4879951477050781, "loss_main": 0.9989351630210876, "loss_parscale": 1.0, "loss_sub_dim": 0.5109400153160095, "loss_vclub": 0.0004177093505859375, "parscale_sim": 0.98828125, "step": 284 }, { "epoch": 0.27298850574712646, "grad_norm": 57.799564361572266, "learning_rate": 4.513157894736843e-06, "loss": 0.9989, "step": 285 }, { "epoch": 0.27298850574712646, "loss_full_dim": 0.4716193675994873, "loss_main": 0.9638434052467346, "loss_parscale": 0.96875, "loss_sub_dim": 0.4922240376472473, "loss_vclub": 0.00049591064453125, "parscale_sim": 0.98828125, "step": 285 }, { "epoch": 0.2739463601532567, "grad_norm": 6.971296787261963, "learning_rate": 4.510526315789474e-06, "loss": 0.9638, "step": 286 }, { "epoch": 0.2739463601532567, "loss_full_dim": 0.47011256217956543, "loss_main": 0.9612969160079956, "loss_parscale": 0.984375, "loss_sub_dim": 0.49118438363075256, "loss_vclub": 0.00055694580078125, "parscale_sim": 0.9921875, "step": 286 }, { "epoch": 0.27490421455938696, "grad_norm": 9.672253608703613, "learning_rate": 4.507894736842106e-06, "loss": 0.9613, "step": 287 }, { "epoch": 0.27490421455938696, "loss_full_dim": 0.4912416338920593, "loss_main": 1.0043022632598877, "loss_parscale": 1.0078125, "loss_sub_dim": 0.5130605697631836, "loss_vclub": 0.00054931640625, "parscale_sim": 0.9921875, "step": 287 }, { "epoch": 0.27586206896551724, "grad_norm": 8.60017204284668, "learning_rate": 4.505263157894737e-06, "loss": 1.0043, "step": 288 }, { "epoch": 0.27586206896551724, "loss_full_dim": 0.41232118010520935, "loss_main": 0.8434847593307495, "loss_parscale": 0.8515625, "loss_sub_dim": 0.43116360902786255, "loss_vclub": 0.0004119873046875, "parscale_sim": 0.9921875, "step": 288 }, { "epoch": 0.2768199233716475, "grad_norm": 7.780846118927002, "learning_rate": 4.502631578947369e-06, "loss": 0.8435, "step": 289 }, { "epoch": 0.2768199233716475, "loss_full_dim": 0.38568833470344543, "loss_main": 0.790361762046814, "loss_parscale": 0.796875, "loss_sub_dim": 0.40467342734336853, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.9921875, "step": 289 }, { "epoch": 0.2777777777777778, "grad_norm": 10.018383979797363, "learning_rate": 4.5e-06, "loss": 0.7904, "step": 290 }, { "epoch": 0.2777777777777778, "loss_full_dim": 0.4772637188434601, "loss_main": 0.9755034446716309, "loss_parscale": 0.9921875, "loss_sub_dim": 0.49823975563049316, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.984375, "step": 290 }, { "epoch": 0.27873563218390807, "grad_norm": 11.992202758789062, "learning_rate": 4.497368421052632e-06, "loss": 0.9755, "step": 291 }, { "epoch": 0.27873563218390807, "loss_full_dim": 0.4053886830806732, "loss_main": 0.8284227252006531, "loss_parscale": 0.84375, "loss_sub_dim": 0.42303404211997986, "loss_vclub": 0.00041961669921875, "parscale_sim": 0.98828125, "step": 291 }, { "epoch": 0.2796934865900383, "grad_norm": 7.830506324768066, "learning_rate": 4.494736842105263e-06, "loss": 0.8284, "step": 292 }, { "epoch": 0.2796934865900383, "loss_full_dim": 0.42946308851242065, "loss_main": 0.8784309029579163, "loss_parscale": 0.8984375, "loss_sub_dim": 0.4489678144454956, "loss_vclub": 0.000553131103515625, "parscale_sim": 0.9921875, "step": 292 }, { "epoch": 0.28065134099616856, "grad_norm": 9.926318168640137, "learning_rate": 4.4921052631578944e-06, "loss": 0.8784, "step": 293 }, { "epoch": 0.28065134099616856, "loss_full_dim": 0.3919347822666168, "loss_main": 0.8038612604141235, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4119264483451843, "loss_vclub": 0.000579833984375, "parscale_sim": 0.9921875, "step": 293 }, { "epoch": 0.28160919540229884, "grad_norm": 9.228681564331055, "learning_rate": 4.489473684210527e-06, "loss": 0.8039, "step": 294 }, { "epoch": 0.28160919540229884, "loss_full_dim": 0.4693540036678314, "loss_main": 0.9591619372367859, "loss_parscale": 0.953125, "loss_sub_dim": 0.48980793356895447, "loss_vclub": 0.000537872314453125, "parscale_sim": 0.9921875, "step": 294 }, { "epoch": 0.2825670498084291, "grad_norm": 317.6538391113281, "learning_rate": 4.4868421052631584e-06, "loss": 0.9592, "step": 295 }, { "epoch": 0.2825670498084291, "loss_full_dim": 0.4816410541534424, "loss_main": 0.9809387922286987, "loss_parscale": 0.9921875, "loss_sub_dim": 0.49929773807525635, "loss_vclub": 0.000629425048828125, "parscale_sim": 0.98828125, "step": 295 }, { "epoch": 0.2835249042145594, "grad_norm": 7.8686676025390625, "learning_rate": 4.48421052631579e-06, "loss": 0.9809, "step": 296 }, { "epoch": 0.2835249042145594, "loss_full_dim": 0.47537028789520264, "loss_main": 0.9698467254638672, "loss_parscale": 0.9765625, "loss_sub_dim": 0.49447643756866455, "loss_vclub": 0.0004730224609375, "parscale_sim": 0.9921875, "step": 296 }, { "epoch": 0.28448275862068967, "grad_norm": 10.316503524780273, "learning_rate": 4.481578947368422e-06, "loss": 0.9698, "step": 297 }, { "epoch": 0.28448275862068967, "loss_full_dim": 0.5250135660171509, "loss_main": 1.068982720375061, "loss_parscale": 1.078125, "loss_sub_dim": 0.5439691543579102, "loss_vclub": 0.0004730224609375, "parscale_sim": 0.9921875, "step": 297 }, { "epoch": 0.28544061302681994, "grad_norm": 7.51985502243042, "learning_rate": 4.478947368421054e-06, "loss": 1.069, "step": 298 }, { "epoch": 0.28544061302681994, "loss_full_dim": 0.4086743891239166, "loss_main": 0.835088312625885, "loss_parscale": 0.83984375, "loss_sub_dim": 0.4264139235019684, "loss_vclub": 0.000579833984375, "parscale_sim": 0.9921875, "step": 298 }, { "epoch": 0.28639846743295017, "grad_norm": 8.230060577392578, "learning_rate": 4.476315789473685e-06, "loss": 0.8351, "step": 299 }, { "epoch": 0.28639846743295017, "loss_full_dim": 0.4829764664173126, "loss_main": 0.9825379848480225, "loss_parscale": 0.984375, "loss_sub_dim": 0.4995615482330322, "loss_vclub": 0.0005340576171875, "parscale_sim": 0.98828125, "step": 299 }, { "epoch": 0.28735632183908044, "grad_norm": 6.964096546173096, "learning_rate": 4.473684210526316e-06, "loss": 0.9825, "step": 300 }, { "epoch": 0.28735632183908044, "loss_full_dim": 0.48644497990608215, "loss_main": 0.9941908121109009, "loss_parscale": 1.0, "loss_sub_dim": 0.5077458620071411, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.9921875, "step": 300 }, { "epoch": 0.2883141762452107, "grad_norm": 6.711770057678223, "learning_rate": 4.471052631578948e-06, "loss": 0.9942, "step": 301 }, { "epoch": 0.2883141762452107, "loss_full_dim": 0.5153290033340454, "loss_main": 1.0513527393341064, "loss_parscale": 1.0625, "loss_sub_dim": 0.5360236763954163, "loss_vclub": 0.0005645751953125, "parscale_sim": 0.984375, "step": 301 }, { "epoch": 0.289272030651341, "grad_norm": 10.167815208435059, "learning_rate": 4.468421052631579e-06, "loss": 1.0514, "step": 302 }, { "epoch": 0.289272030651341, "loss_full_dim": 0.4262804687023163, "loss_main": 0.8712112903594971, "loss_parscale": 0.875, "loss_sub_dim": 0.4449308216571808, "loss_vclub": 0.000736236572265625, "parscale_sim": 0.9921875, "step": 302 }, { "epoch": 0.29022988505747127, "grad_norm": 12.11451530456543, "learning_rate": 4.465789473684211e-06, "loss": 0.8712, "step": 303 }, { "epoch": 0.29022988505747127, "loss_full_dim": 0.49116358160972595, "loss_main": 1.0046639442443848, "loss_parscale": 1.015625, "loss_sub_dim": 0.5135003924369812, "loss_vclub": 0.00043487548828125, "parscale_sim": 0.9921875, "step": 303 }, { "epoch": 0.29118773946360155, "grad_norm": 104.3197021484375, "learning_rate": 4.463157894736842e-06, "loss": 1.0047, "step": 304 }, { "epoch": 0.29118773946360155, "loss_full_dim": 0.41620728373527527, "loss_main": 0.850401759147644, "loss_parscale": 0.859375, "loss_sub_dim": 0.43419450521469116, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.9921875, "step": 304 }, { "epoch": 0.2921455938697318, "grad_norm": 12.047974586486816, "learning_rate": 4.460526315789474e-06, "loss": 0.8504, "step": 305 }, { "epoch": 0.2921455938697318, "loss_full_dim": 0.4282454550266266, "loss_main": 0.874946117401123, "loss_parscale": 0.87109375, "loss_sub_dim": 0.4467006325721741, "loss_vclub": 0.0004329681396484375, "parscale_sim": 0.96484375, "step": 305 }, { "epoch": 0.29310344827586204, "grad_norm": 6.665388584136963, "learning_rate": 4.4578947368421054e-06, "loss": 0.8749, "step": 306 }, { "epoch": 0.29310344827586204, "loss_full_dim": 0.5539806485176086, "loss_main": 1.1298489570617676, "loss_parscale": 1.125, "loss_sub_dim": 0.5758683681488037, "loss_vclub": 0.000499725341796875, "parscale_sim": 0.9921875, "step": 306 }, { "epoch": 0.2940613026819923, "grad_norm": 11.60236644744873, "learning_rate": 4.455263157894737e-06, "loss": 1.1298, "step": 307 }, { "epoch": 0.2940613026819923, "loss_full_dim": 0.5029986500740051, "loss_main": 1.033308982849121, "loss_parscale": 1.03125, "loss_sub_dim": 0.5303102731704712, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.9921875, "step": 307 }, { "epoch": 0.2950191570881226, "grad_norm": 32.57913589477539, "learning_rate": 4.452631578947369e-06, "loss": 1.0333, "step": 308 }, { "epoch": 0.2950191570881226, "loss_full_dim": 0.6013935804367065, "loss_main": 1.2276718616485596, "loss_parscale": 1.21875, "loss_sub_dim": 0.6262782216072083, "loss_vclub": 0.000659942626953125, "parscale_sim": 0.98828125, "step": 308 }, { "epoch": 0.2959770114942529, "grad_norm": 17.676620483398438, "learning_rate": 4.450000000000001e-06, "loss": 1.2277, "step": 309 }, { "epoch": 0.2959770114942529, "loss_full_dim": 0.4220571517944336, "loss_main": 0.8677573800086975, "loss_parscale": 0.87109375, "loss_sub_dim": 0.4457002282142639, "loss_vclub": 0.000576019287109375, "parscale_sim": 0.9921875, "step": 309 }, { "epoch": 0.29693486590038315, "grad_norm": 8.702763557434082, "learning_rate": 4.447368421052632e-06, "loss": 0.8678, "step": 310 }, { "epoch": 0.29693486590038315, "loss_full_dim": 0.4918500483036041, "loss_main": 1.0065257549285889, "loss_parscale": 0.9921875, "loss_sub_dim": 0.5146757364273071, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.9921875, "step": 310 }, { "epoch": 0.2978927203065134, "grad_norm": 8.291084289550781, "learning_rate": 4.444736842105264e-06, "loss": 1.0065, "step": 311 }, { "epoch": 0.2978927203065134, "loss_full_dim": 0.6543565392494202, "loss_main": 1.3387898206710815, "loss_parscale": 1.3359375, "loss_sub_dim": 0.6844332814216614, "loss_vclub": 0.000522613525390625, "parscale_sim": 0.98828125, "step": 311 }, { "epoch": 0.2988505747126437, "grad_norm": 15.343417167663574, "learning_rate": 4.442105263157896e-06, "loss": 1.3388, "step": 312 }, { "epoch": 0.2988505747126437, "loss_full_dim": 0.43776777386665344, "loss_main": 0.9008938074111938, "loss_parscale": 0.8984375, "loss_sub_dim": 0.463126003742218, "loss_vclub": 0.00054931640625, "parscale_sim": 0.984375, "step": 312 }, { "epoch": 0.2998084291187739, "grad_norm": 10.44201374053955, "learning_rate": 4.439473684210527e-06, "loss": 0.9009, "step": 313 }, { "epoch": 0.2998084291187739, "loss_full_dim": 0.4893105924129486, "loss_main": 1.0049819946289062, "loss_parscale": 1.0, "loss_sub_dim": 0.51567143201828, "loss_vclub": 0.000537872314453125, "parscale_sim": 0.9921875, "step": 313 }, { "epoch": 0.3007662835249042, "grad_norm": 18.128196716308594, "learning_rate": 4.436842105263158e-06, "loss": 1.005, "step": 314 }, { "epoch": 0.3007662835249042, "loss_full_dim": 0.4891900420188904, "loss_main": 1.0023365020751953, "loss_parscale": 1.03125, "loss_sub_dim": 0.5131464004516602, "loss_vclub": 0.00067138671875, "parscale_sim": 0.9921875, "step": 314 }, { "epoch": 0.3017241379310345, "grad_norm": 30.361732482910156, "learning_rate": 4.43421052631579e-06, "loss": 1.0023, "step": 315 }, { "epoch": 0.3017241379310345, "loss_full_dim": 0.4714735746383667, "loss_main": 0.9652542471885681, "loss_parscale": 0.96875, "loss_sub_dim": 0.4937806725502014, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.98828125, "step": 315 }, { "epoch": 0.30268199233716475, "grad_norm": 18.127702713012695, "learning_rate": 4.431578947368421e-06, "loss": 0.9653, "step": 316 }, { "epoch": 0.30268199233716475, "loss_full_dim": 0.4689173996448517, "loss_main": 0.9620754718780518, "loss_parscale": 0.9609375, "loss_sub_dim": 0.49315810203552246, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.98828125, "step": 316 }, { "epoch": 0.303639846743295, "grad_norm": 7.161415100097656, "learning_rate": 4.428947368421053e-06, "loss": 0.9621, "step": 317 }, { "epoch": 0.303639846743295, "loss_full_dim": 0.46173739433288574, "loss_main": 0.943759560585022, "loss_parscale": 0.9375, "loss_sub_dim": 0.48202216625213623, "loss_vclub": 0.00051116943359375, "parscale_sim": 0.98828125, "step": 317 }, { "epoch": 0.3045977011494253, "grad_norm": 9.09197998046875, "learning_rate": 4.426315789473684e-06, "loss": 0.9438, "step": 318 }, { "epoch": 0.3045977011494253, "loss_full_dim": 0.4455729126930237, "loss_main": 0.9113483428955078, "loss_parscale": 0.921875, "loss_sub_dim": 0.46577543020248413, "loss_vclub": 0.000579833984375, "parscale_sim": 0.9921875, "step": 318 }, { "epoch": 0.3055555555555556, "grad_norm": 9.6340970993042, "learning_rate": 4.423684210526316e-06, "loss": 0.9113, "step": 319 }, { "epoch": 0.3055555555555556, "loss_full_dim": 0.42382410168647766, "loss_main": 0.8672462701797485, "loss_parscale": 0.875, "loss_sub_dim": 0.4434221684932709, "loss_vclub": 0.000568389892578125, "parscale_sim": 0.9921875, "step": 319 }, { "epoch": 0.3065134099616858, "grad_norm": 9.00440788269043, "learning_rate": 4.4210526315789476e-06, "loss": 0.8672, "step": 320 }, { "epoch": 0.3065134099616858, "loss_full_dim": 0.46930205821990967, "loss_main": 0.9599835872650146, "loss_parscale": 0.96484375, "loss_sub_dim": 0.49068155884742737, "loss_vclub": 0.000640869140625, "parscale_sim": 0.9921875, "step": 320 }, { "epoch": 0.3074712643678161, "grad_norm": 13.007828712463379, "learning_rate": 4.418421052631579e-06, "loss": 0.96, "step": 321 }, { "epoch": 0.3074712643678161, "loss_full_dim": 0.4338834881782532, "loss_main": 0.8896158933639526, "loss_parscale": 0.89453125, "loss_sub_dim": 0.45573243498802185, "loss_vclub": 0.000701904296875, "parscale_sim": 0.984375, "step": 321 }, { "epoch": 0.30842911877394635, "grad_norm": 8.276413917541504, "learning_rate": 4.415789473684211e-06, "loss": 0.8896, "step": 322 }, { "epoch": 0.30842911877394635, "loss_full_dim": 0.46873652935028076, "loss_main": 0.9563747048377991, "loss_parscale": 0.953125, "loss_sub_dim": 0.4876381754875183, "loss_vclub": 0.0005035400390625, "parscale_sim": 0.98828125, "step": 322 }, { "epoch": 0.30938697318007663, "grad_norm": 9.484288215637207, "learning_rate": 4.413157894736843e-06, "loss": 0.9564, "step": 323 }, { "epoch": 0.30938697318007663, "loss_full_dim": 0.5027353763580322, "loss_main": 1.0241730213165283, "loss_parscale": 1.03125, "loss_sub_dim": 0.5214375853538513, "loss_vclub": 0.0005035400390625, "parscale_sim": 0.98828125, "step": 323 }, { "epoch": 0.3103448275862069, "grad_norm": 11.048410415649414, "learning_rate": 4.410526315789474e-06, "loss": 1.0242, "step": 324 }, { "epoch": 0.3103448275862069, "loss_full_dim": 0.39006057381629944, "loss_main": 0.7995771169662476, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4095165729522705, "loss_vclub": 0.00054931640625, "parscale_sim": 0.98828125, "step": 324 }, { "epoch": 0.3113026819923372, "grad_norm": 22.24156379699707, "learning_rate": 4.407894736842105e-06, "loss": 0.7996, "step": 325 }, { "epoch": 0.3113026819923372, "loss_full_dim": 0.4136107861995697, "loss_main": 0.8475766181945801, "loss_parscale": 0.859375, "loss_sub_dim": 0.43396586179733276, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.9921875, "step": 325 }, { "epoch": 0.31226053639846746, "grad_norm": 9.443460464477539, "learning_rate": 4.405263157894737e-06, "loss": 0.8476, "step": 326 }, { "epoch": 0.31226053639846746, "loss_full_dim": 0.49333277344703674, "loss_main": 1.0080206394195557, "loss_parscale": 0.99609375, "loss_sub_dim": 0.5146878957748413, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.9921875, "step": 326 }, { "epoch": 0.3132183908045977, "grad_norm": 10.453150749206543, "learning_rate": 4.402631578947369e-06, "loss": 1.008, "step": 327 }, { "epoch": 0.3132183908045977, "loss_full_dim": 0.5180562734603882, "loss_main": 1.0609155893325806, "loss_parscale": 1.0625, "loss_sub_dim": 0.5428593158721924, "loss_vclub": 0.00051116943359375, "parscale_sim": 0.9921875, "step": 327 }, { "epoch": 0.31417624521072796, "grad_norm": 12.630012512207031, "learning_rate": 4.4e-06, "loss": 1.0609, "step": 328 }, { "epoch": 0.31417624521072796, "loss_full_dim": 0.5070019364356995, "loss_main": 1.0368294715881348, "loss_parscale": 1.03125, "loss_sub_dim": 0.5298275947570801, "loss_vclub": 0.000530242919921875, "parscale_sim": 0.9921875, "step": 328 }, { "epoch": 0.31513409961685823, "grad_norm": 12.612765312194824, "learning_rate": 4.397368421052632e-06, "loss": 1.0368, "step": 329 }, { "epoch": 0.31513409961685823, "loss_full_dim": 0.5222896337509155, "loss_main": 1.0713374614715576, "loss_parscale": 1.0703125, "loss_sub_dim": 0.5490477681159973, "loss_vclub": 0.000576019287109375, "parscale_sim": 0.95703125, "step": 329 }, { "epoch": 0.3160919540229885, "grad_norm": 10.087514877319336, "learning_rate": 4.394736842105263e-06, "loss": 1.0713, "step": 330 }, { "epoch": 0.3160919540229885, "loss_full_dim": 0.5330392718315125, "loss_main": 1.0965280532836914, "loss_parscale": 1.125, "loss_sub_dim": 0.5634888410568237, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.98828125, "step": 330 }, { "epoch": 0.3170498084291188, "grad_norm": 24.734272003173828, "learning_rate": 4.392105263157895e-06, "loss": 1.0965, "step": 331 }, { "epoch": 0.3170498084291188, "loss_full_dim": 0.5459811687469482, "loss_main": 1.1174001693725586, "loss_parscale": 1.1171875, "loss_sub_dim": 0.5714190006256104, "loss_vclub": 0.000579833984375, "parscale_sim": 0.97265625, "step": 331 }, { "epoch": 0.31800766283524906, "grad_norm": 42.24786376953125, "learning_rate": 4.3894736842105266e-06, "loss": 1.1174, "step": 332 }, { "epoch": 0.31800766283524906, "loss_full_dim": 0.4729773998260498, "loss_main": 0.9700703620910645, "loss_parscale": 0.96875, "loss_sub_dim": 0.49709296226501465, "loss_vclub": 0.000518798828125, "parscale_sim": 0.9765625, "step": 332 }, { "epoch": 0.31896551724137934, "grad_norm": 11.9762601852417, "learning_rate": 4.3868421052631586e-06, "loss": 0.9701, "step": 333 }, { "epoch": 0.31896551724137934, "loss_full_dim": 0.4085378348827362, "loss_main": 0.837844967842102, "loss_parscale": 0.8515625, "loss_sub_dim": 0.42930713295936584, "loss_vclub": 0.00055694580078125, "parscale_sim": 0.98828125, "step": 333 }, { "epoch": 0.31992337164750956, "grad_norm": 6.045828342437744, "learning_rate": 4.38421052631579e-06, "loss": 0.8378, "step": 334 }, { "epoch": 0.31992337164750956, "loss_full_dim": 0.46609607338905334, "loss_main": 0.9556998014450073, "loss_parscale": 0.94921875, "loss_sub_dim": 0.4896036982536316, "loss_vclub": 0.000484466552734375, "parscale_sim": 0.98828125, "step": 334 }, { "epoch": 0.32088122605363983, "grad_norm": 10.40355110168457, "learning_rate": 4.381578947368421e-06, "loss": 0.9557, "step": 335 }, { "epoch": 0.32088122605363983, "loss_full_dim": 0.4909511208534241, "loss_main": 1.0056843757629395, "loss_parscale": 1.015625, "loss_sub_dim": 0.5147333145141602, "loss_vclub": 0.0005645751953125, "parscale_sim": 0.98828125, "step": 335 }, { "epoch": 0.3218390804597701, "grad_norm": 7.5517706871032715, "learning_rate": 4.378947368421053e-06, "loss": 1.0057, "step": 336 }, { "epoch": 0.3218390804597701, "loss_full_dim": 0.5095177292823792, "loss_main": 1.0409655570983887, "loss_parscale": 1.03125, "loss_sub_dim": 0.5314477682113647, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.98828125, "step": 336 }, { "epoch": 0.3227969348659004, "grad_norm": 9.129403114318848, "learning_rate": 4.376315789473685e-06, "loss": 1.041, "step": 337 }, { "epoch": 0.3227969348659004, "loss_full_dim": 0.4848366677761078, "loss_main": 0.9939152002334595, "loss_parscale": 0.9921875, "loss_sub_dim": 0.5090785026550293, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.9921875, "step": 337 }, { "epoch": 0.32375478927203066, "grad_norm": 31.46364402770996, "learning_rate": 4.373684210526316e-06, "loss": 0.9939, "step": 338 }, { "epoch": 0.32375478927203066, "loss_full_dim": 0.48932337760925293, "loss_main": 1.0020802021026611, "loss_parscale": 1.0078125, "loss_sub_dim": 0.5127568244934082, "loss_vclub": 0.000507354736328125, "parscale_sim": 0.98828125, "step": 338 }, { "epoch": 0.32471264367816094, "grad_norm": 9.905885696411133, "learning_rate": 4.371052631578947e-06, "loss": 1.0021, "step": 339 }, { "epoch": 0.32471264367816094, "loss_full_dim": 0.4867449998855591, "loss_main": 1.0004055500030518, "loss_parscale": 1.015625, "loss_sub_dim": 0.5136605501174927, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.9921875, "step": 339 }, { "epoch": 0.32567049808429116, "grad_norm": 9.661269187927246, "learning_rate": 4.368421052631579e-06, "loss": 1.0004, "step": 340 }, { "epoch": 0.32567049808429116, "loss_full_dim": 0.4595504105091095, "loss_main": 0.9442905187606812, "loss_parscale": 0.953125, "loss_sub_dim": 0.48474007844924927, "loss_vclub": 0.00055694580078125, "parscale_sim": 0.96875, "step": 340 }, { "epoch": 0.32662835249042144, "grad_norm": 6.9442338943481445, "learning_rate": 4.365789473684211e-06, "loss": 0.9443, "step": 341 }, { "epoch": 0.32662835249042144, "loss_full_dim": 0.48710355162620544, "loss_main": 0.9938786029815674, "loss_parscale": 0.9921875, "loss_sub_dim": 0.5067750215530396, "loss_vclub": 0.0006103515625, "parscale_sim": 0.984375, "step": 341 }, { "epoch": 0.3275862068965517, "grad_norm": 10.082763671875, "learning_rate": 4.363157894736842e-06, "loss": 0.9939, "step": 342 }, { "epoch": 0.3275862068965517, "loss_full_dim": 0.40296435356140137, "loss_main": 0.8258755207061768, "loss_parscale": 0.82421875, "loss_sub_dim": 0.422911137342453, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.984375, "step": 342 }, { "epoch": 0.328544061302682, "grad_norm": 8.580089569091797, "learning_rate": 4.3605263157894735e-06, "loss": 0.8259, "step": 343 }, { "epoch": 0.328544061302682, "loss_full_dim": 0.44647836685180664, "loss_main": 0.9130740165710449, "loss_parscale": 0.9375, "loss_sub_dim": 0.4665956199169159, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.9921875, "step": 343 }, { "epoch": 0.32950191570881227, "grad_norm": 25.423660278320312, "learning_rate": 4.3578947368421055e-06, "loss": 0.9131, "step": 344 }, { "epoch": 0.32950191570881227, "loss_full_dim": 0.48322632908821106, "loss_main": 0.9901934862136841, "loss_parscale": 1.015625, "loss_sub_dim": 0.5069671869277954, "loss_vclub": 0.000659942626953125, "parscale_sim": 0.9921875, "step": 344 }, { "epoch": 0.33045977011494254, "grad_norm": 8.026153564453125, "learning_rate": 4.3552631578947375e-06, "loss": 0.9902, "step": 345 }, { "epoch": 0.33045977011494254, "loss_full_dim": 0.41554251313209534, "loss_main": 0.8557497262954712, "loss_parscale": 0.8671875, "loss_sub_dim": 0.44020718336105347, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.984375, "step": 345 }, { "epoch": 0.3314176245210728, "grad_norm": 9.12739086151123, "learning_rate": 4.352631578947369e-06, "loss": 0.8557, "step": 346 }, { "epoch": 0.3314176245210728, "loss_full_dim": 0.43887460231781006, "loss_main": 0.8970842957496643, "loss_parscale": 0.89453125, "loss_sub_dim": 0.45820969343185425, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.9921875, "step": 346 }, { "epoch": 0.33237547892720304, "grad_norm": 8.224167823791504, "learning_rate": 4.350000000000001e-06, "loss": 0.8971, "step": 347 }, { "epoch": 0.33237547892720304, "loss_full_dim": 0.48896247148513794, "loss_main": 1.0034961700439453, "loss_parscale": 0.99609375, "loss_sub_dim": 0.5145336389541626, "loss_vclub": 0.000637054443359375, "parscale_sim": 0.984375, "step": 347 }, { "epoch": 0.3333333333333333, "grad_norm": 10.101871490478516, "learning_rate": 4.347368421052632e-06, "loss": 1.0035, "step": 348 }, { "epoch": 0.3333333333333333, "loss_full_dim": 0.395991712808609, "loss_main": 0.8110753297805786, "loss_parscale": 0.8125, "loss_sub_dim": 0.415083646774292, "loss_vclub": 0.000576019287109375, "parscale_sim": 0.9921875, "step": 348 }, { "epoch": 0.3342911877394636, "grad_norm": 8.981754302978516, "learning_rate": 4.344736842105263e-06, "loss": 0.8111, "step": 349 }, { "epoch": 0.3342911877394636, "loss_full_dim": 0.4395950138568878, "loss_main": 0.8986459970474243, "loss_parscale": 0.9140625, "loss_sub_dim": 0.4590510129928589, "loss_vclub": 0.00051116943359375, "parscale_sim": 0.98828125, "step": 349 }, { "epoch": 0.33524904214559387, "grad_norm": 9.983348846435547, "learning_rate": 4.342105263157895e-06, "loss": 0.8986, "step": 350 }, { "epoch": 0.33524904214559387, "loss_full_dim": 0.47637879848480225, "loss_main": 0.974756121635437, "loss_parscale": 0.9765625, "loss_sub_dim": 0.49837735295295715, "loss_vclub": 0.000537872314453125, "parscale_sim": 0.98828125, "step": 350 }, { "epoch": 0.33620689655172414, "grad_norm": 10.479521751403809, "learning_rate": 4.339473684210527e-06, "loss": 0.9748, "step": 351 }, { "epoch": 0.33620689655172414, "loss_full_dim": 0.42699483036994934, "loss_main": 0.8739281296730042, "loss_parscale": 0.875, "loss_sub_dim": 0.4469332993030548, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 351 }, { "epoch": 0.3371647509578544, "grad_norm": 15.09753704071045, "learning_rate": 4.336842105263158e-06, "loss": 0.8739, "step": 352 }, { "epoch": 0.3371647509578544, "loss_full_dim": 0.4770442843437195, "loss_main": 0.9741792678833008, "loss_parscale": 0.9765625, "loss_sub_dim": 0.4971349537372589, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 352 }, { "epoch": 0.3381226053639847, "grad_norm": 8.378952026367188, "learning_rate": 4.334210526315789e-06, "loss": 0.9742, "step": 353 }, { "epoch": 0.3381226053639847, "loss_full_dim": 0.4641458988189697, "loss_main": 0.948350727558136, "loss_parscale": 0.953125, "loss_sub_dim": 0.48420482873916626, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 353 }, { "epoch": 0.3390804597701149, "grad_norm": 8.742182731628418, "learning_rate": 4.331578947368421e-06, "loss": 0.9484, "step": 354 }, { "epoch": 0.3390804597701149, "loss_full_dim": 0.424886018037796, "loss_main": 0.8712066411972046, "loss_parscale": 0.8828125, "loss_sub_dim": 0.4463205933570862, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.98828125, "step": 354 }, { "epoch": 0.3400383141762452, "grad_norm": 9.117094039916992, "learning_rate": 4.328947368421053e-06, "loss": 0.8712, "step": 355 }, { "epoch": 0.3400383141762452, "loss_full_dim": 0.46518537402153015, "loss_main": 0.9489305019378662, "loss_parscale": 0.9375, "loss_sub_dim": 0.48374509811401367, "loss_vclub": 0.00054168701171875, "parscale_sim": 0.984375, "step": 355 }, { "epoch": 0.34099616858237547, "grad_norm": 8.116683959960938, "learning_rate": 4.3263157894736845e-06, "loss": 0.9489, "step": 356 }, { "epoch": 0.34099616858237547, "loss_full_dim": 0.5319132804870605, "loss_main": 1.0848009586334229, "loss_parscale": 1.078125, "loss_sub_dim": 0.5528876781463623, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.9921875, "step": 356 }, { "epoch": 0.34195402298850575, "grad_norm": 9.231797218322754, "learning_rate": 4.323684210526316e-06, "loss": 1.0848, "step": 357 }, { "epoch": 0.34195402298850575, "loss_full_dim": 0.41470542550086975, "loss_main": 0.8473281860351562, "loss_parscale": 0.84375, "loss_sub_dim": 0.4326227605342865, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.9765625, "step": 357 }, { "epoch": 0.342911877394636, "grad_norm": 6.951185703277588, "learning_rate": 4.321052631578948e-06, "loss": 0.8473, "step": 358 }, { "epoch": 0.342911877394636, "loss_full_dim": 0.46515679359436035, "loss_main": 0.9481095671653748, "loss_parscale": 0.94140625, "loss_sub_dim": 0.4829527735710144, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.98828125, "step": 358 }, { "epoch": 0.3438697318007663, "grad_norm": 9.592046737670898, "learning_rate": 4.31842105263158e-06, "loss": 0.9481, "step": 359 }, { "epoch": 0.3438697318007663, "loss_full_dim": 0.4256281852722168, "loss_main": 0.8712435960769653, "loss_parscale": 0.875, "loss_sub_dim": 0.44561541080474854, "loss_vclub": 0.000530242919921875, "parscale_sim": 0.9921875, "step": 359 }, { "epoch": 0.3448275862068966, "grad_norm": 10.603206634521484, "learning_rate": 4.315789473684211e-06, "loss": 0.8712, "step": 360 }, { "epoch": 0.3448275862068966, "loss_full_dim": 0.41809600591659546, "loss_main": 0.8581884503364563, "loss_parscale": 0.85546875, "loss_sub_dim": 0.44009244441986084, "loss_vclub": 0.000499725341796875, "parscale_sim": 0.98828125, "step": 360 }, { "epoch": 0.3457854406130268, "grad_norm": 7.395258903503418, "learning_rate": 4.313157894736843e-06, "loss": 0.8582, "step": 361 }, { "epoch": 0.3457854406130268, "loss_full_dim": 0.4542994797229767, "loss_main": 0.9277842044830322, "loss_parscale": 0.9375, "loss_sub_dim": 0.47348475456237793, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.984375, "step": 361 }, { "epoch": 0.34674329501915707, "grad_norm": 10.307706832885742, "learning_rate": 4.310526315789474e-06, "loss": 0.9278, "step": 362 }, { "epoch": 0.34674329501915707, "loss_full_dim": 0.43102768063545227, "loss_main": 0.8809823989868164, "loss_parscale": 0.8828125, "loss_sub_dim": 0.44995471835136414, "loss_vclub": 0.000614166259765625, "parscale_sim": 0.9765625, "step": 362 }, { "epoch": 0.34770114942528735, "grad_norm": 7.263495922088623, "learning_rate": 4.307894736842105e-06, "loss": 0.881, "step": 363 }, { "epoch": 0.34770114942528735, "loss_full_dim": 0.40863919258117676, "loss_main": 0.8376893997192383, "loss_parscale": 0.84375, "loss_sub_dim": 0.4290502071380615, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.9921875, "step": 363 }, { "epoch": 0.3486590038314176, "grad_norm": 9.277572631835938, "learning_rate": 4.305263157894737e-06, "loss": 0.8377, "step": 364 }, { "epoch": 0.3486590038314176, "loss_full_dim": 0.44653794169425964, "loss_main": 0.9134308099746704, "loss_parscale": 0.91796875, "loss_sub_dim": 0.4668928384780884, "loss_vclub": 0.000621795654296875, "parscale_sim": 0.98828125, "step": 364 }, { "epoch": 0.3496168582375479, "grad_norm": 7.496508598327637, "learning_rate": 4.302631578947369e-06, "loss": 0.9134, "step": 365 }, { "epoch": 0.3496168582375479, "loss_full_dim": 0.4775778651237488, "loss_main": 0.9779017567634583, "loss_parscale": 0.98828125, "loss_sub_dim": 0.5003238916397095, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.9921875, "step": 365 }, { "epoch": 0.3505747126436782, "grad_norm": 13.275524139404297, "learning_rate": 4.3e-06, "loss": 0.9779, "step": 366 }, { "epoch": 0.3505747126436782, "loss_full_dim": 0.39808300137519836, "loss_main": 0.8161699175834656, "loss_parscale": 0.8203125, "loss_sub_dim": 0.4180869162082672, "loss_vclub": 0.000579833984375, "parscale_sim": 0.98828125, "step": 366 }, { "epoch": 0.35153256704980845, "grad_norm": 8.871745109558105, "learning_rate": 4.2973684210526315e-06, "loss": 0.8162, "step": 367 }, { "epoch": 0.35153256704980845, "loss_full_dim": 0.46687382459640503, "loss_main": 0.9577904939651489, "loss_parscale": 0.9765625, "loss_sub_dim": 0.4909166395664215, "loss_vclub": 0.000579833984375, "parscale_sim": 0.98828125, "step": 367 }, { "epoch": 0.3524904214559387, "grad_norm": 12.953768730163574, "learning_rate": 4.2947368421052635e-06, "loss": 0.9578, "step": 368 }, { "epoch": 0.3524904214559387, "loss_full_dim": 0.41924482583999634, "loss_main": 0.8588818311691284, "loss_parscale": 0.86328125, "loss_sub_dim": 0.4396369755268097, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.9921875, "step": 368 }, { "epoch": 0.35344827586206895, "grad_norm": 8.196922302246094, "learning_rate": 4.2921052631578955e-06, "loss": 0.8589, "step": 369 }, { "epoch": 0.35344827586206895, "loss_full_dim": 0.488022118806839, "loss_main": 1.0008009672164917, "loss_parscale": 1.015625, "loss_sub_dim": 0.5127788782119751, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.98828125, "step": 369 }, { "epoch": 0.3544061302681992, "grad_norm": 16.164655685424805, "learning_rate": 4.289473684210527e-06, "loss": 1.0008, "step": 370 }, { "epoch": 0.3544061302681992, "loss_full_dim": 0.5364131927490234, "loss_main": 1.0960534811019897, "loss_parscale": 1.078125, "loss_sub_dim": 0.5596402883529663, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.9921875, "step": 370 }, { "epoch": 0.3553639846743295, "grad_norm": 9.01752758026123, "learning_rate": 4.286842105263158e-06, "loss": 1.0961, "step": 371 }, { "epoch": 0.3553639846743295, "loss_full_dim": 0.5138240456581116, "loss_main": 1.049748182296753, "loss_parscale": 1.0625, "loss_sub_dim": 0.5359241366386414, "loss_vclub": 0.00067138671875, "parscale_sim": 0.9921875, "step": 371 }, { "epoch": 0.3563218390804598, "grad_norm": 10.446864128112793, "learning_rate": 4.28421052631579e-06, "loss": 1.0497, "step": 372 }, { "epoch": 0.3563218390804598, "loss_full_dim": 0.4551287293434143, "loss_main": 0.9304155111312866, "loss_parscale": 0.9375, "loss_sub_dim": 0.4752867519855499, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.98828125, "step": 372 }, { "epoch": 0.35727969348659006, "grad_norm": 6.715888500213623, "learning_rate": 4.281578947368422e-06, "loss": 0.9304, "step": 373 }, { "epoch": 0.35727969348659006, "loss_full_dim": 0.44249802827835083, "loss_main": 0.9048665761947632, "loss_parscale": 0.9140625, "loss_sub_dim": 0.46236851811408997, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.9921875, "step": 373 }, { "epoch": 0.35823754789272033, "grad_norm": 7.155416011810303, "learning_rate": 4.278947368421053e-06, "loss": 0.9049, "step": 374 }, { "epoch": 0.35823754789272033, "loss_full_dim": 0.46881458163261414, "loss_main": 0.9577963948249817, "loss_parscale": 0.9609375, "loss_sub_dim": 0.48898181319236755, "loss_vclub": 0.000659942626953125, "parscale_sim": 0.9921875, "step": 374 }, { "epoch": 0.35919540229885055, "grad_norm": 10.761484146118164, "learning_rate": 4.276315789473684e-06, "loss": 0.9578, "step": 375 }, { "epoch": 0.35919540229885055, "loss_full_dim": 0.4871046841144562, "loss_main": 0.9967273473739624, "loss_parscale": 1.0, "loss_sub_dim": 0.5096226930618286, "loss_vclub": 0.000568389892578125, "parscale_sim": 0.9921875, "step": 375 }, { "epoch": 0.36015325670498083, "grad_norm": 8.725781440734863, "learning_rate": 4.273684210526316e-06, "loss": 0.9967, "step": 376 }, { "epoch": 0.36015325670498083, "loss_full_dim": 0.44209709763526917, "loss_main": 0.9052878618240356, "loss_parscale": 0.90234375, "loss_sub_dim": 0.4631907343864441, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.98828125, "step": 376 }, { "epoch": 0.3611111111111111, "grad_norm": 8.18521785736084, "learning_rate": 4.271052631578947e-06, "loss": 0.9053, "step": 377 }, { "epoch": 0.3611111111111111, "loss_full_dim": 0.43272846937179565, "loss_main": 0.8858870267868042, "loss_parscale": 0.890625, "loss_sub_dim": 0.45315852761268616, "loss_vclub": 0.0004673004150390625, "parscale_sim": 0.984375, "step": 377 }, { "epoch": 0.3620689655172414, "grad_norm": 7.5024919509887695, "learning_rate": 4.268421052631579e-06, "loss": 0.8859, "step": 378 }, { "epoch": 0.3620689655172414, "loss_full_dim": 0.453589528799057, "loss_main": 0.9275256395339966, "loss_parscale": 0.9375, "loss_sub_dim": 0.4739360809326172, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.98828125, "step": 378 }, { "epoch": 0.36302681992337166, "grad_norm": 10.00794506072998, "learning_rate": 4.265789473684211e-06, "loss": 0.9275, "step": 379 }, { "epoch": 0.36302681992337166, "loss_full_dim": 0.4871354103088379, "loss_main": 0.9936972856521606, "loss_parscale": 0.984375, "loss_sub_dim": 0.5065618753433228, "loss_vclub": 0.000598907470703125, "parscale_sim": 0.98828125, "step": 379 }, { "epoch": 0.36398467432950193, "grad_norm": 47.017181396484375, "learning_rate": 4.2631578947368425e-06, "loss": 0.9937, "step": 380 }, { "epoch": 0.36398467432950193, "loss_full_dim": 0.39208078384399414, "loss_main": 0.8036899566650391, "loss_parscale": 0.8125, "loss_sub_dim": 0.4116091728210449, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 380 }, { "epoch": 0.3649425287356322, "grad_norm": 8.05971908569336, "learning_rate": 4.260526315789474e-06, "loss": 0.8037, "step": 381 }, { "epoch": 0.3649425287356322, "loss_full_dim": 0.42800793051719666, "loss_main": 0.8761366009712219, "loss_parscale": 0.87890625, "loss_sub_dim": 0.44812867045402527, "loss_vclub": 0.000640869140625, "parscale_sim": 0.98828125, "step": 381 }, { "epoch": 0.36590038314176243, "grad_norm": 12.850507736206055, "learning_rate": 4.257894736842106e-06, "loss": 0.8761, "step": 382 }, { "epoch": 0.36590038314176243, "loss_full_dim": 0.47891175746917725, "loss_main": 0.9779064655303955, "loss_parscale": 0.984375, "loss_sub_dim": 0.49899470806121826, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.984375, "step": 382 }, { "epoch": 0.3668582375478927, "grad_norm": 8.173101425170898, "learning_rate": 4.255263157894738e-06, "loss": 0.9779, "step": 383 }, { "epoch": 0.3668582375478927, "loss_full_dim": 0.47503119707107544, "loss_main": 0.970728874206543, "loss_parscale": 0.96484375, "loss_sub_dim": 0.49569764733314514, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 383 }, { "epoch": 0.367816091954023, "grad_norm": 10.01792049407959, "learning_rate": 4.252631578947369e-06, "loss": 0.9707, "step": 384 }, { "epoch": 0.367816091954023, "loss_full_dim": 0.45604366064071655, "loss_main": 0.930018961429596, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4739753007888794, "loss_vclub": 0.00067138671875, "parscale_sim": 0.9921875, "step": 384 }, { "epoch": 0.36877394636015326, "grad_norm": 13.419453620910645, "learning_rate": 4.25e-06, "loss": 0.93, "step": 385 }, { "epoch": 0.36877394636015326, "loss_full_dim": 0.4245266318321228, "loss_main": 0.8682953119277954, "loss_parscale": 0.875, "loss_sub_dim": 0.443768709897995, "loss_vclub": 0.000640869140625, "parscale_sim": 0.98828125, "step": 385 }, { "epoch": 0.36973180076628354, "grad_norm": 6.336372375488281, "learning_rate": 4.247368421052632e-06, "loss": 0.8683, "step": 386 }, { "epoch": 0.36973180076628354, "loss_full_dim": 0.3766653835773468, "loss_main": 0.7727830410003662, "loss_parscale": 0.7734375, "loss_sub_dim": 0.396117627620697, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.9921875, "step": 386 }, { "epoch": 0.3706896551724138, "grad_norm": 9.738414764404297, "learning_rate": 4.244736842105264e-06, "loss": 0.7728, "step": 387 }, { "epoch": 0.3706896551724138, "loss_full_dim": 0.4266118109226227, "loss_main": 0.8726050853729248, "loss_parscale": 0.87109375, "loss_sub_dim": 0.4459933042526245, "loss_vclub": 0.0005645751953125, "parscale_sim": 0.9921875, "step": 387 }, { "epoch": 0.3716475095785441, "grad_norm": 11.579068183898926, "learning_rate": 4.242105263157895e-06, "loss": 0.8726, "step": 388 }, { "epoch": 0.3716475095785441, "loss_full_dim": 0.4382663071155548, "loss_main": 0.8927673101425171, "loss_parscale": 0.8984375, "loss_sub_dim": 0.4545009732246399, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.984375, "step": 388 }, { "epoch": 0.3726053639846743, "grad_norm": 10.872875213623047, "learning_rate": 4.239473684210526e-06, "loss": 0.8928, "step": 389 }, { "epoch": 0.3726053639846743, "loss_full_dim": 0.41800636053085327, "loss_main": 0.8579092025756836, "loss_parscale": 0.859375, "loss_sub_dim": 0.43990281224250793, "loss_vclub": 0.000583648681640625, "parscale_sim": 0.9921875, "step": 389 }, { "epoch": 0.3735632183908046, "grad_norm": 7.820930480957031, "learning_rate": 4.236842105263158e-06, "loss": 0.8579, "step": 390 }, { "epoch": 0.3735632183908046, "loss_full_dim": 0.4402148127555847, "loss_main": 0.9017785787582397, "loss_parscale": 0.90234375, "loss_sub_dim": 0.4615637958049774, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.9921875, "step": 390 }, { "epoch": 0.37452107279693486, "grad_norm": 7.109933853149414, "learning_rate": 4.2342105263157895e-06, "loss": 0.9018, "step": 391 }, { "epoch": 0.37452107279693486, "loss_full_dim": 0.4472580850124359, "loss_main": 0.914267361164093, "loss_parscale": 0.9140625, "loss_sub_dim": 0.4670092761516571, "loss_vclub": 0.000743865966796875, "parscale_sim": 0.98828125, "step": 391 }, { "epoch": 0.37547892720306514, "grad_norm": 7.019252777099609, "learning_rate": 4.2315789473684215e-06, "loss": 0.9143, "step": 392 }, { "epoch": 0.37547892720306514, "loss_full_dim": 0.5165498852729797, "loss_main": 1.0549190044403076, "loss_parscale": 1.0546875, "loss_sub_dim": 0.5383691787719727, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.984375, "step": 392 }, { "epoch": 0.3764367816091954, "grad_norm": 8.488003730773926, "learning_rate": 4.228947368421053e-06, "loss": 1.0549, "step": 393 }, { "epoch": 0.3764367816091954, "loss_full_dim": 0.4624643623828888, "loss_main": 0.9448226690292358, "loss_parscale": 0.94921875, "loss_sub_dim": 0.48235827684402466, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.9921875, "step": 393 }, { "epoch": 0.3773946360153257, "grad_norm": 8.930899620056152, "learning_rate": 4.226315789473685e-06, "loss": 0.9448, "step": 394 }, { "epoch": 0.3773946360153257, "loss_full_dim": 0.39840689301490784, "loss_main": 0.8180058598518372, "loss_parscale": 0.80859375, "loss_sub_dim": 0.4195989668369293, "loss_vclub": 0.000560760498046875, "parscale_sim": 0.9921875, "step": 394 }, { "epoch": 0.3783524904214559, "grad_norm": 8.104022979736328, "learning_rate": 4.223684210526316e-06, "loss": 0.818, "step": 395 }, { "epoch": 0.3783524904214559, "loss_full_dim": 0.45102015137672424, "loss_main": 0.9195668697357178, "loss_parscale": 0.91796875, "loss_sub_dim": 0.46854668855667114, "loss_vclub": 0.0006103515625, "parscale_sim": 0.9765625, "step": 395 }, { "epoch": 0.3793103448275862, "grad_norm": 25.2667236328125, "learning_rate": 4.221052631578948e-06, "loss": 0.9196, "step": 396 }, { "epoch": 0.3793103448275862, "loss_full_dim": 0.42921626567840576, "loss_main": 0.8800885677337646, "loss_parscale": 0.875, "loss_sub_dim": 0.4508723020553589, "loss_vclub": 0.000537872314453125, "parscale_sim": 0.98828125, "step": 396 }, { "epoch": 0.38026819923371646, "grad_norm": 10.440531730651855, "learning_rate": 4.21842105263158e-06, "loss": 0.8801, "step": 397 }, { "epoch": 0.38026819923371646, "loss_full_dim": 0.48641645908355713, "loss_main": 0.9938787221908569, "loss_parscale": 1.0, "loss_sub_dim": 0.5074622631072998, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98828125, "step": 397 }, { "epoch": 0.38122605363984674, "grad_norm": 32.24504470825195, "learning_rate": 4.215789473684211e-06, "loss": 0.9939, "step": 398 }, { "epoch": 0.38122605363984674, "loss_full_dim": 0.49735504388809204, "loss_main": 1.017209768295288, "loss_parscale": 1.0234375, "loss_sub_dim": 0.5198546648025513, "loss_vclub": 0.000579833984375, "parscale_sim": 0.98828125, "step": 398 }, { "epoch": 0.382183908045977, "grad_norm": 9.464401245117188, "learning_rate": 4.213157894736842e-06, "loss": 1.0172, "step": 399 }, { "epoch": 0.382183908045977, "loss_full_dim": 0.4742211699485779, "loss_main": 0.9715732336044312, "loss_parscale": 0.9765625, "loss_sub_dim": 0.49735209345817566, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.98828125, "step": 399 }, { "epoch": 0.3831417624521073, "grad_norm": 8.733227729797363, "learning_rate": 4.210526315789474e-06, "loss": 0.9716, "step": 400 }, { "epoch": 0.3831417624521073, "loss_full_dim": 0.38726890087127686, "loss_main": 0.7930299043655396, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4057610034942627, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98828125, "step": 400 }, { "epoch": 0.38409961685823757, "grad_norm": 8.816071510314941, "learning_rate": 4.207894736842106e-06, "loss": 0.793, "step": 401 }, { "epoch": 0.38409961685823757, "loss_full_dim": 0.44987088441848755, "loss_main": 0.9236364364624023, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4737655222415924, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.98828125, "step": 401 }, { "epoch": 0.3850574712643678, "grad_norm": 10.076164245605469, "learning_rate": 4.205263157894737e-06, "loss": 0.9236, "step": 402 }, { "epoch": 0.3850574712643678, "loss_full_dim": 0.46317151188850403, "loss_main": 0.9449728727340698, "loss_parscale": 0.9609375, "loss_sub_dim": 0.4818013906478882, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.98046875, "step": 402 }, { "epoch": 0.38601532567049807, "grad_norm": 7.368901252746582, "learning_rate": 4.2026315789473684e-06, "loss": 0.945, "step": 403 }, { "epoch": 0.38601532567049807, "loss_full_dim": 0.4223281741142273, "loss_main": 0.8634780645370483, "loss_parscale": 0.859375, "loss_sub_dim": 0.44114986062049866, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98828125, "step": 403 }, { "epoch": 0.38697318007662834, "grad_norm": 8.625066757202148, "learning_rate": 4.2000000000000004e-06, "loss": 0.8635, "step": 404 }, { "epoch": 0.38697318007662834, "loss_full_dim": 0.34953805804252625, "loss_main": 0.7144157886505127, "loss_parscale": 0.71875, "loss_sub_dim": 0.36487776041030884, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.9921875, "step": 404 }, { "epoch": 0.3879310344827586, "grad_norm": 8.694732666015625, "learning_rate": 4.197368421052632e-06, "loss": 0.7144, "step": 405 }, { "epoch": 0.3879310344827586, "loss_full_dim": 0.4281255304813385, "loss_main": 0.8749062418937683, "loss_parscale": 0.87890625, "loss_sub_dim": 0.4467807114124298, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.9921875, "step": 405 }, { "epoch": 0.3888888888888889, "grad_norm": 55.68412780761719, "learning_rate": 4.194736842105264e-06, "loss": 0.8749, "step": 406 }, { "epoch": 0.3888888888888889, "loss_full_dim": 0.46113306283950806, "loss_main": 0.9421705603599548, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4810374975204468, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.9921875, "step": 406 }, { "epoch": 0.38984674329501917, "grad_norm": 8.849422454833984, "learning_rate": 4.192105263157895e-06, "loss": 0.9422, "step": 407 }, { "epoch": 0.38984674329501917, "loss_full_dim": 0.46497395634651184, "loss_main": 0.9507193565368652, "loss_parscale": 0.953125, "loss_sub_dim": 0.4857454299926758, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98828125, "step": 407 }, { "epoch": 0.39080459770114945, "grad_norm": 6.725809574127197, "learning_rate": 4.189473684210527e-06, "loss": 0.9507, "step": 408 }, { "epoch": 0.39080459770114945, "loss_full_dim": 0.3681986331939697, "loss_main": 0.7572967410087585, "loss_parscale": 0.76171875, "loss_sub_dim": 0.3890981078147888, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.98828125, "step": 408 }, { "epoch": 0.39176245210727967, "grad_norm": 9.150272369384766, "learning_rate": 4.186842105263158e-06, "loss": 0.7573, "step": 409 }, { "epoch": 0.39176245210727967, "loss_full_dim": 0.42353689670562744, "loss_main": 0.8663000464439392, "loss_parscale": 0.8671875, "loss_sub_dim": 0.44276314973831177, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.98828125, "step": 409 }, { "epoch": 0.39272030651340994, "grad_norm": 8.678020477294922, "learning_rate": 4.18421052631579e-06, "loss": 0.8663, "step": 410 }, { "epoch": 0.39272030651340994, "loss_full_dim": 0.3692479729652405, "loss_main": 0.7559953927993774, "loss_parscale": 0.765625, "loss_sub_dim": 0.3867473900318146, "loss_vclub": 0.0005645751953125, "parscale_sim": 0.9921875, "step": 410 }, { "epoch": 0.3936781609195402, "grad_norm": 12.922295570373535, "learning_rate": 4.181578947368421e-06, "loss": 0.756, "step": 411 }, { "epoch": 0.3936781609195402, "loss_full_dim": 0.44260373711586, "loss_main": 0.9042131900787354, "loss_parscale": 0.90625, "loss_sub_dim": 0.461609423160553, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.98828125, "step": 411 }, { "epoch": 0.3946360153256705, "grad_norm": 7.890651226043701, "learning_rate": 4.178947368421053e-06, "loss": 0.9042, "step": 412 }, { "epoch": 0.3946360153256705, "loss_full_dim": 0.351467490196228, "loss_main": 0.7223517298698425, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3708842396736145, "loss_vclub": 0.0006103515625, "parscale_sim": 0.9921875, "step": 412 }, { "epoch": 0.3955938697318008, "grad_norm": 30.422536849975586, "learning_rate": 4.176315789473684e-06, "loss": 0.7224, "step": 413 }, { "epoch": 0.3955938697318008, "loss_full_dim": 0.4424351155757904, "loss_main": 0.9012370109558105, "loss_parscale": 0.91015625, "loss_sub_dim": 0.45880192518234253, "loss_vclub": 0.000518798828125, "parscale_sim": 0.9921875, "step": 413 }, { "epoch": 0.39655172413793105, "grad_norm": 7.523470401763916, "learning_rate": 4.173684210526316e-06, "loss": 0.9012, "step": 414 }, { "epoch": 0.39655172413793105, "loss_full_dim": 0.39484572410583496, "loss_main": 0.8078362345695496, "loss_parscale": 0.81640625, "loss_sub_dim": 0.4129905104637146, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.9921875, "step": 414 }, { "epoch": 0.3975095785440613, "grad_norm": 9.134872436523438, "learning_rate": 4.171052631578948e-06, "loss": 0.8078, "step": 415 }, { "epoch": 0.3975095785440613, "loss_full_dim": 0.4514067769050598, "loss_main": 0.9243760108947754, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4729692041873932, "loss_vclub": 0.00052642822265625, "parscale_sim": 0.9921875, "step": 415 }, { "epoch": 0.39846743295019155, "grad_norm": 7.524125099182129, "learning_rate": 4.1684210526315794e-06, "loss": 0.9244, "step": 416 }, { "epoch": 0.39846743295019155, "loss_full_dim": 0.4031737744808197, "loss_main": 0.8247092366218567, "loss_parscale": 0.8203125, "loss_sub_dim": 0.421535462141037, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.98828125, "step": 416 }, { "epoch": 0.3994252873563218, "grad_norm": 8.898538589477539, "learning_rate": 4.165789473684211e-06, "loss": 0.8247, "step": 417 }, { "epoch": 0.3994252873563218, "loss_full_dim": 0.42805707454681396, "loss_main": 0.8755141496658325, "loss_parscale": 0.875, "loss_sub_dim": 0.44745710492134094, "loss_vclub": 0.000762939453125, "parscale_sim": 0.9921875, "step": 417 }, { "epoch": 0.4003831417624521, "grad_norm": 8.301877975463867, "learning_rate": 4.163157894736843e-06, "loss": 0.8755, "step": 418 }, { "epoch": 0.4003831417624521, "loss_full_dim": 0.3859550356864929, "loss_main": 0.7887036800384521, "loss_parscale": 0.80859375, "loss_sub_dim": 0.40274861454963684, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 418 }, { "epoch": 0.4013409961685824, "grad_norm": 7.985762119293213, "learning_rate": 4.160526315789475e-06, "loss": 0.7887, "step": 419 }, { "epoch": 0.4013409961685824, "loss_full_dim": 0.4175320565700531, "loss_main": 0.8516582250595093, "loss_parscale": 0.84375, "loss_sub_dim": 0.43412619829177856, "loss_vclub": 0.00055694580078125, "parscale_sim": 0.98828125, "step": 419 }, { "epoch": 0.40229885057471265, "grad_norm": 8.507913589477539, "learning_rate": 4.157894736842106e-06, "loss": 0.8517, "step": 420 }, { "epoch": 0.40229885057471265, "loss_full_dim": 0.4271259307861328, "loss_main": 0.8739840984344482, "loss_parscale": 0.8828125, "loss_sub_dim": 0.44685816764831543, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.9921875, "step": 420 }, { "epoch": 0.40325670498084293, "grad_norm": 12.049805641174316, "learning_rate": 4.155263157894737e-06, "loss": 0.874, "step": 421 }, { "epoch": 0.40325670498084293, "loss_full_dim": 0.41078197956085205, "loss_main": 0.8419060111045837, "loss_parscale": 0.85546875, "loss_sub_dim": 0.4311240315437317, "loss_vclub": 0.000732421875, "parscale_sim": 0.98828125, "step": 421 }, { "epoch": 0.4042145593869732, "grad_norm": 13.00418758392334, "learning_rate": 4.152631578947369e-06, "loss": 0.8419, "step": 422 }, { "epoch": 0.4042145593869732, "loss_full_dim": 0.47750595211982727, "loss_main": 0.975269615650177, "loss_parscale": 0.9765625, "loss_sub_dim": 0.49776366353034973, "loss_vclub": 0.000690460205078125, "parscale_sim": 0.98828125, "step": 422 }, { "epoch": 0.4051724137931034, "grad_norm": 9.63241195678711, "learning_rate": 4.15e-06, "loss": 0.9753, "step": 423 }, { "epoch": 0.4051724137931034, "loss_full_dim": 0.4209142029285431, "loss_main": 0.860163688659668, "loss_parscale": 0.859375, "loss_sub_dim": 0.4392494559288025, "loss_vclub": 0.00054168701171875, "parscale_sim": 0.9921875, "step": 423 }, { "epoch": 0.4061302681992337, "grad_norm": 7.401691913604736, "learning_rate": 4.147368421052632e-06, "loss": 0.8602, "step": 424 }, { "epoch": 0.4061302681992337, "loss_full_dim": 0.37909260392189026, "loss_main": 0.7777637243270874, "loss_parscale": 0.765625, "loss_sub_dim": 0.39867109060287476, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98828125, "step": 424 }, { "epoch": 0.407088122605364, "grad_norm": 8.016939163208008, "learning_rate": 4.144736842105263e-06, "loss": 0.7778, "step": 425 }, { "epoch": 0.407088122605364, "loss_full_dim": 0.40696749091148376, "loss_main": 0.8329364061355591, "loss_parscale": 0.8359375, "loss_sub_dim": 0.4259689450263977, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.9921875, "step": 425 }, { "epoch": 0.40804597701149425, "grad_norm": 8.027145385742188, "learning_rate": 4.142105263157895e-06, "loss": 0.8329, "step": 426 }, { "epoch": 0.40804597701149425, "loss_full_dim": 0.3948684334754944, "loss_main": 0.8108862042427063, "loss_parscale": 0.796875, "loss_sub_dim": 0.4160177707672119, "loss_vclub": 0.00057220458984375, "parscale_sim": 0.9921875, "step": 426 }, { "epoch": 0.40900383141762453, "grad_norm": 6.602686882019043, "learning_rate": 4.139473684210526e-06, "loss": 0.8109, "step": 427 }, { "epoch": 0.40900383141762453, "loss_full_dim": 0.46957600116729736, "loss_main": 0.9597362279891968, "loss_parscale": 0.9609375, "loss_sub_dim": 0.4901602566242218, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.98828125, "step": 427 }, { "epoch": 0.4099616858237548, "grad_norm": 9.147735595703125, "learning_rate": 4.136842105263158e-06, "loss": 0.9597, "step": 428 }, { "epoch": 0.4099616858237548, "loss_full_dim": 0.5110257267951965, "loss_main": 1.046844720840454, "loss_parscale": 1.046875, "loss_sub_dim": 0.5358189344406128, "loss_vclub": 0.00054931640625, "parscale_sim": 0.9765625, "step": 428 }, { "epoch": 0.4109195402298851, "grad_norm": 8.399147987365723, "learning_rate": 4.13421052631579e-06, "loss": 1.0468, "step": 429 }, { "epoch": 0.4109195402298851, "loss_full_dim": 0.4294820725917816, "loss_main": 0.8787529468536377, "loss_parscale": 0.890625, "loss_sub_dim": 0.4492708742618561, "loss_vclub": 0.000553131103515625, "parscale_sim": 0.9921875, "step": 429 }, { "epoch": 0.4118773946360153, "grad_norm": 9.586782455444336, "learning_rate": 4.1315789473684216e-06, "loss": 0.8788, "step": 430 }, { "epoch": 0.4118773946360153, "loss_full_dim": 0.4109470844268799, "loss_main": 0.8431974649429321, "loss_parscale": 0.84765625, "loss_sub_dim": 0.43225035071372986, "loss_vclub": 0.000576019287109375, "parscale_sim": 0.984375, "step": 430 }, { "epoch": 0.4128352490421456, "grad_norm": 7.9171600341796875, "learning_rate": 4.128947368421053e-06, "loss": 0.8432, "step": 431 }, { "epoch": 0.4128352490421456, "loss_full_dim": 0.4313555955886841, "loss_main": 0.8831566572189331, "loss_parscale": 0.890625, "loss_sub_dim": 0.45180103182792664, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98046875, "step": 431 }, { "epoch": 0.41379310344827586, "grad_norm": 9.842731475830078, "learning_rate": 4.126315789473685e-06, "loss": 0.8832, "step": 432 }, { "epoch": 0.41379310344827586, "loss_full_dim": 0.4196734130382538, "loss_main": 0.8560320138931274, "loss_parscale": 0.85546875, "loss_sub_dim": 0.43635860085487366, "loss_vclub": 0.000640869140625, "parscale_sim": 0.984375, "step": 432 }, { "epoch": 0.41475095785440613, "grad_norm": 8.481257438659668, "learning_rate": 4.123684210526317e-06, "loss": 0.856, "step": 433 }, { "epoch": 0.41475095785440613, "loss_full_dim": 0.44562849402427673, "loss_main": 0.9098720550537109, "loss_parscale": 0.90625, "loss_sub_dim": 0.4642435908317566, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.9921875, "step": 433 }, { "epoch": 0.4157088122605364, "grad_norm": 7.474489212036133, "learning_rate": 4.121052631578948e-06, "loss": 0.9099, "step": 434 }, { "epoch": 0.4157088122605364, "loss_full_dim": 0.44655001163482666, "loss_main": 0.9128831028938293, "loss_parscale": 0.9375, "loss_sub_dim": 0.4663330912590027, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 434 }, { "epoch": 0.4166666666666667, "grad_norm": 7.236392021179199, "learning_rate": 4.118421052631579e-06, "loss": 0.9129, "step": 435 }, { "epoch": 0.4166666666666667, "loss_full_dim": 0.4318729043006897, "loss_main": 0.8833335638046265, "loss_parscale": 0.8828125, "loss_sub_dim": 0.4514606297016144, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.9921875, "step": 435 }, { "epoch": 0.41762452107279696, "grad_norm": 7.802637100219727, "learning_rate": 4.115789473684211e-06, "loss": 0.8833, "step": 436 }, { "epoch": 0.41762452107279696, "loss_full_dim": 0.45306143164634705, "loss_main": 0.9268473386764526, "loss_parscale": 0.90625, "loss_sub_dim": 0.4737858772277832, "loss_vclub": 0.0006103515625, "parscale_sim": 0.98828125, "step": 436 }, { "epoch": 0.4185823754789272, "grad_norm": 6.234859466552734, "learning_rate": 4.113157894736842e-06, "loss": 0.9268, "step": 437 }, { "epoch": 0.4185823754789272, "loss_full_dim": 0.3628863990306854, "loss_main": 0.7432752847671509, "loss_parscale": 0.7421875, "loss_sub_dim": 0.38038885593414307, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.98828125, "step": 437 }, { "epoch": 0.41954022988505746, "grad_norm": 8.306745529174805, "learning_rate": 4.110526315789474e-06, "loss": 0.7433, "step": 438 }, { "epoch": 0.41954022988505746, "loss_full_dim": 0.37009820342063904, "loss_main": 0.7573850750923157, "loss_parscale": 0.77734375, "loss_sub_dim": 0.38728687167167664, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.98828125, "step": 438 }, { "epoch": 0.42049808429118773, "grad_norm": 6.352539539337158, "learning_rate": 4.107894736842105e-06, "loss": 0.7574, "step": 439 }, { "epoch": 0.42049808429118773, "loss_full_dim": 0.40397515892982483, "loss_main": 0.824984073638916, "loss_parscale": 0.8203125, "loss_sub_dim": 0.4210089445114136, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.98828125, "step": 439 }, { "epoch": 0.421455938697318, "grad_norm": 7.016097545623779, "learning_rate": 4.105263157894737e-06, "loss": 0.825, "step": 440 }, { "epoch": 0.421455938697318, "loss_full_dim": 0.42832428216934204, "loss_main": 0.8758153319358826, "loss_parscale": 0.87109375, "loss_sub_dim": 0.4474910497665405, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.9921875, "step": 440 }, { "epoch": 0.4224137931034483, "grad_norm": 6.557914733886719, "learning_rate": 4.1026315789473686e-06, "loss": 0.8758, "step": 441 }, { "epoch": 0.4224137931034483, "loss_full_dim": 0.39304715394973755, "loss_main": 0.8035370111465454, "loss_parscale": 0.82421875, "loss_sub_dim": 0.41048985719680786, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 441 }, { "epoch": 0.42337164750957856, "grad_norm": 8.088637351989746, "learning_rate": 4.1e-06, "loss": 0.8035, "step": 442 }, { "epoch": 0.42337164750957856, "loss_full_dim": 0.4163850247859955, "loss_main": 0.8534404039382935, "loss_parscale": 0.86328125, "loss_sub_dim": 0.43705540895462036, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.98828125, "step": 442 }, { "epoch": 0.42432950191570884, "grad_norm": 8.48879623413086, "learning_rate": 4.097368421052632e-06, "loss": 0.8534, "step": 443 }, { "epoch": 0.42432950191570884, "loss_full_dim": 0.36687418818473816, "loss_main": 0.7522403597831726, "loss_parscale": 0.7578125, "loss_sub_dim": 0.38536617159843445, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.98828125, "step": 443 }, { "epoch": 0.42528735632183906, "grad_norm": 5.994161128997803, "learning_rate": 4.094736842105264e-06, "loss": 0.7522, "step": 444 }, { "epoch": 0.42528735632183906, "loss_full_dim": 0.43907657265663147, "loss_main": 0.8975226879119873, "loss_parscale": 0.8984375, "loss_sub_dim": 0.45844611525535583, "loss_vclub": 0.000537872314453125, "parscale_sim": 0.98828125, "step": 444 }, { "epoch": 0.42624521072796934, "grad_norm": 76.68180084228516, "learning_rate": 4.092105263157895e-06, "loss": 0.8975, "step": 445 }, { "epoch": 0.42624521072796934, "loss_full_dim": 0.381888210773468, "loss_main": 0.7810176610946655, "loss_parscale": 0.80078125, "loss_sub_dim": 0.3991294503211975, "loss_vclub": 0.0005645751953125, "parscale_sim": 0.984375, "step": 445 }, { "epoch": 0.4272030651340996, "grad_norm": 7.897893905639648, "learning_rate": 4.089473684210527e-06, "loss": 0.781, "step": 446 }, { "epoch": 0.4272030651340996, "loss_full_dim": 0.4476184844970703, "loss_main": 0.9165661334991455, "loss_parscale": 0.9140625, "loss_sub_dim": 0.4689476788043976, "loss_vclub": 0.000629425048828125, "parscale_sim": 0.98046875, "step": 446 }, { "epoch": 0.4281609195402299, "grad_norm": 7.941000938415527, "learning_rate": 4.086842105263159e-06, "loss": 0.9166, "step": 447 }, { "epoch": 0.4281609195402299, "loss_full_dim": 0.37852218747138977, "loss_main": 0.7737925052642822, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39527028799057007, "loss_vclub": 0.000732421875, "parscale_sim": 0.98828125, "step": 447 }, { "epoch": 0.42911877394636017, "grad_norm": 7.211135387420654, "learning_rate": 4.08421052631579e-06, "loss": 0.7738, "step": 448 }, { "epoch": 0.42911877394636017, "loss_full_dim": 0.4049410820007324, "loss_main": 0.8295608162879944, "loss_parscale": 0.8359375, "loss_sub_dim": 0.42461973428726196, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.984375, "step": 448 }, { "epoch": 0.43007662835249044, "grad_norm": 10.497943878173828, "learning_rate": 4.081578947368421e-06, "loss": 0.8296, "step": 449 }, { "epoch": 0.43007662835249044, "loss_full_dim": 0.46161654591560364, "loss_main": 0.9445170760154724, "loss_parscale": 0.921875, "loss_sub_dim": 0.4829005300998688, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98046875, "step": 449 }, { "epoch": 0.43103448275862066, "grad_norm": 32.002784729003906, "learning_rate": 4.078947368421053e-06, "loss": 0.9445, "step": 450 }, { "epoch": 0.43103448275862066, "loss_full_dim": 0.38209474086761475, "loss_main": 0.7811105847358704, "loss_parscale": 0.78515625, "loss_sub_dim": 0.3990158438682556, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 450 }, { "epoch": 0.43199233716475094, "grad_norm": 8.485442161560059, "learning_rate": 4.076315789473684e-06, "loss": 0.7811, "step": 451 }, { "epoch": 0.43199233716475094, "loss_full_dim": 0.43027234077453613, "loss_main": 0.878991961479187, "loss_parscale": 0.8828125, "loss_sub_dim": 0.4487196207046509, "loss_vclub": 0.000507354736328125, "parscale_sim": 0.984375, "step": 451 }, { "epoch": 0.4329501915708812, "grad_norm": 9.799806594848633, "learning_rate": 4.073684210526316e-06, "loss": 0.879, "step": 452 }, { "epoch": 0.4329501915708812, "loss_full_dim": 0.4535713493824005, "loss_main": 0.9234437942504883, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4698724150657654, "loss_vclub": 0.0006103515625, "parscale_sim": 0.9921875, "step": 452 }, { "epoch": 0.4339080459770115, "grad_norm": 8.43388557434082, "learning_rate": 4.0710526315789475e-06, "loss": 0.9234, "step": 453 }, { "epoch": 0.4339080459770115, "loss_full_dim": 0.3926011919975281, "loss_main": 0.8019375205039978, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4093363285064697, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.98828125, "step": 453 }, { "epoch": 0.43486590038314177, "grad_norm": 8.49964427947998, "learning_rate": 4.0684210526315795e-06, "loss": 0.8019, "step": 454 }, { "epoch": 0.43486590038314177, "loss_full_dim": 0.44309717416763306, "loss_main": 0.9073010683059692, "loss_parscale": 0.90625, "loss_sub_dim": 0.46420392394065857, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.98828125, "step": 454 }, { "epoch": 0.43582375478927204, "grad_norm": 7.776839733123779, "learning_rate": 4.065789473684211e-06, "loss": 0.9073, "step": 455 }, { "epoch": 0.43582375478927204, "loss_full_dim": 0.4280761182308197, "loss_main": 0.8754653334617615, "loss_parscale": 0.890625, "loss_sub_dim": 0.4473892152309418, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.984375, "step": 455 }, { "epoch": 0.4367816091954023, "grad_norm": 10.081803321838379, "learning_rate": 4.063157894736842e-06, "loss": 0.8755, "step": 456 }, { "epoch": 0.4367816091954023, "loss_full_dim": 0.4180128574371338, "loss_main": 0.8552014827728271, "loss_parscale": 0.859375, "loss_sub_dim": 0.43718865513801575, "loss_vclub": 0.00048828125, "parscale_sim": 0.98828125, "step": 456 }, { "epoch": 0.43773946360153254, "grad_norm": 8.504680633544922, "learning_rate": 4.060526315789474e-06, "loss": 0.8552, "step": 457 }, { "epoch": 0.43773946360153254, "loss_full_dim": 0.3450942635536194, "loss_main": 0.7071056365966797, "loss_parscale": 0.71484375, "loss_sub_dim": 0.3620113730430603, "loss_vclub": 0.000514984130859375, "parscale_sim": 0.984375, "step": 457 }, { "epoch": 0.4386973180076628, "grad_norm": 9.040584564208984, "learning_rate": 4.057894736842106e-06, "loss": 0.7071, "step": 458 }, { "epoch": 0.4386973180076628, "loss_full_dim": 0.3953726887702942, "loss_main": 0.8076515197753906, "loss_parscale": 0.81640625, "loss_sub_dim": 0.41227880120277405, "loss_vclub": 0.00067138671875, "parscale_sim": 0.9921875, "step": 458 }, { "epoch": 0.4396551724137931, "grad_norm": 8.10900592803955, "learning_rate": 4.055263157894737e-06, "loss": 0.8077, "step": 459 }, { "epoch": 0.4396551724137931, "loss_full_dim": 0.3984360992908478, "loss_main": 0.8132420778274536, "loss_parscale": 0.8203125, "loss_sub_dim": 0.41480594873428345, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 459 }, { "epoch": 0.44061302681992337, "grad_norm": 8.010199546813965, "learning_rate": 4.052631578947368e-06, "loss": 0.8132, "step": 460 }, { "epoch": 0.44061302681992337, "loss_full_dim": 0.4138461649417877, "loss_main": 0.8473191261291504, "loss_parscale": 0.8515625, "loss_sub_dim": 0.43347299098968506, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.984375, "step": 460 }, { "epoch": 0.44157088122605365, "grad_norm": 7.907596588134766, "learning_rate": 4.05e-06, "loss": 0.8473, "step": 461 }, { "epoch": 0.44157088122605365, "loss_full_dim": 0.44065409898757935, "loss_main": 0.9039369821548462, "loss_parscale": 0.90625, "loss_sub_dim": 0.46328288316726685, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.984375, "step": 461 }, { "epoch": 0.4425287356321839, "grad_norm": 7.662137031555176, "learning_rate": 4.047368421052632e-06, "loss": 0.9039, "step": 462 }, { "epoch": 0.4425287356321839, "loss_full_dim": 0.45918920636177063, "loss_main": 0.9437543749809265, "loss_parscale": 0.921875, "loss_sub_dim": 0.4845651686191559, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.984375, "step": 462 }, { "epoch": 0.4434865900383142, "grad_norm": 14.039395332336426, "learning_rate": 4.044736842105263e-06, "loss": 0.9438, "step": 463 }, { "epoch": 0.4434865900383142, "loss_full_dim": 0.3796301782131195, "loss_main": 0.7793662548065186, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39973607659339905, "loss_vclub": 0.00052642822265625, "parscale_sim": 0.98828125, "step": 463 }, { "epoch": 0.4444444444444444, "grad_norm": 9.020685195922852, "learning_rate": 4.042105263157895e-06, "loss": 0.7794, "step": 464 }, { "epoch": 0.4444444444444444, "loss_full_dim": 0.4763851463794708, "loss_main": 0.975766122341156, "loss_parscale": 0.984375, "loss_sub_dim": 0.4993809759616852, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.98828125, "step": 464 }, { "epoch": 0.4454022988505747, "grad_norm": 10.51294994354248, "learning_rate": 4.0394736842105265e-06, "loss": 0.9758, "step": 465 }, { "epoch": 0.4454022988505747, "loss_full_dim": 0.3879341781139374, "loss_main": 0.7946592569351196, "loss_parscale": 0.8046875, "loss_sub_dim": 0.40672504901885986, "loss_vclub": 0.000640869140625, "parscale_sim": 0.984375, "step": 465 }, { "epoch": 0.446360153256705, "grad_norm": 7.748394012451172, "learning_rate": 4.0368421052631585e-06, "loss": 0.7947, "step": 466 }, { "epoch": 0.446360153256705, "loss_full_dim": 0.4957222640514374, "loss_main": 1.0120422840118408, "loss_parscale": 1.0390625, "loss_sub_dim": 0.516319990158081, "loss_vclub": 0.000659942626953125, "parscale_sim": 0.9921875, "step": 466 }, { "epoch": 0.44731800766283525, "grad_norm": 9.309063911437988, "learning_rate": 4.03421052631579e-06, "loss": 1.012, "step": 467 }, { "epoch": 0.44731800766283525, "loss_full_dim": 0.4652417302131653, "loss_main": 0.957604706287384, "loss_parscale": 0.96875, "loss_sub_dim": 0.49236297607421875, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.9921875, "step": 467 }, { "epoch": 0.4482758620689655, "grad_norm": 9.733976364135742, "learning_rate": 4.031578947368422e-06, "loss": 0.9576, "step": 468 }, { "epoch": 0.4482758620689655, "loss_full_dim": 0.5266444683074951, "loss_main": 1.0866683721542358, "loss_parscale": 1.078125, "loss_sub_dim": 0.5600239038467407, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.98046875, "step": 468 }, { "epoch": 0.4492337164750958, "grad_norm": 12.135215759277344, "learning_rate": 4.028947368421053e-06, "loss": 1.0867, "step": 469 }, { "epoch": 0.4492337164750958, "loss_full_dim": 0.4485056400299072, "loss_main": 0.9245826601982117, "loss_parscale": 0.9140625, "loss_sub_dim": 0.47607702016830444, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.984375, "step": 469 }, { "epoch": 0.4501915708812261, "grad_norm": 29.90410041809082, "learning_rate": 4.026315789473684e-06, "loss": 0.9246, "step": 470 }, { "epoch": 0.4501915708812261, "loss_full_dim": 0.4398793578147888, "loss_main": 0.9026653170585632, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4627859592437744, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.98828125, "step": 470 }, { "epoch": 0.4511494252873563, "grad_norm": 8.7228364944458, "learning_rate": 4.023684210526316e-06, "loss": 0.9027, "step": 471 }, { "epoch": 0.4511494252873563, "loss_full_dim": 0.42775294184684753, "loss_main": 0.8751533031463623, "loss_parscale": 0.875, "loss_sub_dim": 0.4474003314971924, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.98828125, "step": 471 }, { "epoch": 0.4521072796934866, "grad_norm": 5.667320728302002, "learning_rate": 4.021052631578948e-06, "loss": 0.8752, "step": 472 }, { "epoch": 0.4521072796934866, "loss_full_dim": 0.48940664529800415, "loss_main": 1.0064458847045898, "loss_parscale": 1.015625, "loss_sub_dim": 0.5170392394065857, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 472 }, { "epoch": 0.45306513409961685, "grad_norm": 7.307234764099121, "learning_rate": 4.018421052631579e-06, "loss": 1.0064, "step": 473 }, { "epoch": 0.45306513409961685, "loss_full_dim": 0.47946929931640625, "loss_main": 0.9789903163909912, "loss_parscale": 0.97265625, "loss_sub_dim": 0.49952101707458496, "loss_vclub": 0.000858306884765625, "parscale_sim": 0.9921875, "step": 473 }, { "epoch": 0.4540229885057471, "grad_norm": 9.50627613067627, "learning_rate": 4.01578947368421e-06, "loss": 0.979, "step": 474 }, { "epoch": 0.4540229885057471, "loss_full_dim": 0.5669803023338318, "loss_main": 1.1611061096191406, "loss_parscale": 1.1484375, "loss_sub_dim": 0.5941258668899536, "loss_vclub": 0.000579833984375, "parscale_sim": 0.98828125, "step": 474 }, { "epoch": 0.4549808429118774, "grad_norm": 63.10331344604492, "learning_rate": 4.013157894736842e-06, "loss": 1.1611, "step": 475 }, { "epoch": 0.4549808429118774, "loss_full_dim": 0.4866257309913635, "loss_main": 1.0015432834625244, "loss_parscale": 1.0, "loss_sub_dim": 0.5149176120758057, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 475 }, { "epoch": 0.4559386973180077, "grad_norm": 10.005372047424316, "learning_rate": 4.010526315789474e-06, "loss": 1.0015, "step": 476 }, { "epoch": 0.4559386973180077, "loss_full_dim": 0.4117278456687927, "loss_main": 0.8461319208145142, "loss_parscale": 0.859375, "loss_sub_dim": 0.43440404534339905, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.9921875, "step": 476 }, { "epoch": 0.45689655172413796, "grad_norm": 8.000143051147461, "learning_rate": 4.0078947368421055e-06, "loss": 0.8461, "step": 477 }, { "epoch": 0.45689655172413796, "loss_full_dim": 0.44900229573249817, "loss_main": 0.9241607189178467, "loss_parscale": 0.9453125, "loss_sub_dim": 0.4751583933830261, "loss_vclub": 0.00054168701171875, "parscale_sim": 0.9921875, "step": 477 }, { "epoch": 0.4578544061302682, "grad_norm": 8.582259178161621, "learning_rate": 4.005263157894737e-06, "loss": 0.9242, "step": 478 }, { "epoch": 0.4578544061302682, "loss_full_dim": 0.43659594655036926, "loss_main": 0.8952489495277405, "loss_parscale": 0.90625, "loss_sub_dim": 0.4586530029773712, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.98828125, "step": 478 }, { "epoch": 0.45881226053639845, "grad_norm": 10.76664924621582, "learning_rate": 4.002631578947369e-06, "loss": 0.8952, "step": 479 }, { "epoch": 0.45881226053639845, "loss_full_dim": 0.4489383399486542, "loss_main": 0.9216482639312744, "loss_parscale": 0.921875, "loss_sub_dim": 0.4727099537849426, "loss_vclub": 0.000492095947265625, "parscale_sim": 0.98828125, "step": 479 }, { "epoch": 0.45977011494252873, "grad_norm": 133.8269500732422, "learning_rate": 4.000000000000001e-06, "loss": 0.9216, "step": 480 }, { "epoch": 0.45977011494252873, "loss_full_dim": 0.39964717626571655, "loss_main": 0.8208923935890198, "loss_parscale": 0.859375, "loss_sub_dim": 0.4212452173233032, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98828125, "step": 480 }, { "epoch": 0.460727969348659, "grad_norm": 10.511771202087402, "learning_rate": 3.997368421052632e-06, "loss": 0.8209, "step": 481 }, { "epoch": 0.460727969348659, "loss_full_dim": 0.4259560704231262, "loss_main": 0.8728632926940918, "loss_parscale": 0.8828125, "loss_sub_dim": 0.4469072222709656, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.9921875, "step": 481 }, { "epoch": 0.4616858237547893, "grad_norm": 8.862483024597168, "learning_rate": 3.994736842105264e-06, "loss": 0.8729, "step": 482 }, { "epoch": 0.4616858237547893, "loss_full_dim": 0.4262685775756836, "loss_main": 0.8733706474304199, "loss_parscale": 0.8984375, "loss_sub_dim": 0.44710206985473633, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.984375, "step": 482 }, { "epoch": 0.46264367816091956, "grad_norm": 9.983879089355469, "learning_rate": 3.992105263157895e-06, "loss": 0.8734, "step": 483 }, { "epoch": 0.46264367816091956, "loss_full_dim": 0.40023720264434814, "loss_main": 0.8206837773323059, "loss_parscale": 0.828125, "loss_sub_dim": 0.42044657468795776, "loss_vclub": 0.000637054443359375, "parscale_sim": 0.9921875, "step": 483 }, { "epoch": 0.46360153256704983, "grad_norm": 8.773262023925781, "learning_rate": 3.989473684210526e-06, "loss": 0.8207, "step": 484 }, { "epoch": 0.46360153256704983, "loss_full_dim": 0.384526789188385, "loss_main": 0.7883957624435425, "loss_parscale": 0.796875, "loss_sub_dim": 0.40386900305747986, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.98828125, "step": 484 }, { "epoch": 0.46455938697318006, "grad_norm": 7.071913242340088, "learning_rate": 3.986842105263158e-06, "loss": 0.7884, "step": 485 }, { "epoch": 0.46455938697318006, "loss_full_dim": 0.3410552144050598, "loss_main": 0.7013222575187683, "loss_parscale": 0.71875, "loss_sub_dim": 0.3602670431137085, "loss_vclub": 0.000629425048828125, "parscale_sim": 0.98828125, "step": 485 }, { "epoch": 0.46551724137931033, "grad_norm": 8.0024995803833, "learning_rate": 3.98421052631579e-06, "loss": 0.7013, "step": 486 }, { "epoch": 0.46551724137931033, "loss_full_dim": 0.39897459745407104, "loss_main": 0.8224575519561768, "loss_parscale": 0.8359375, "loss_sub_dim": 0.4234829545021057, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.984375, "step": 486 }, { "epoch": 0.4664750957854406, "grad_norm": 13.31377124786377, "learning_rate": 3.981578947368421e-06, "loss": 0.8225, "step": 487 }, { "epoch": 0.4664750957854406, "loss_full_dim": 0.36620062589645386, "loss_main": 0.7538900375366211, "loss_parscale": 0.75390625, "loss_sub_dim": 0.38768941164016724, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98828125, "step": 487 }, { "epoch": 0.4674329501915709, "grad_norm": 8.689013481140137, "learning_rate": 3.9789473684210525e-06, "loss": 0.7539, "step": 488 }, { "epoch": 0.4674329501915709, "loss_full_dim": 0.41435110569000244, "loss_main": 0.8499876260757446, "loss_parscale": 0.8515625, "loss_sub_dim": 0.4356365203857422, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98046875, "step": 488 }, { "epoch": 0.46839080459770116, "grad_norm": 9.909832000732422, "learning_rate": 3.9763157894736845e-06, "loss": 0.85, "step": 489 }, { "epoch": 0.46839080459770116, "loss_full_dim": 0.4691178500652313, "loss_main": 0.9596928358078003, "loss_parscale": 0.9609375, "loss_sub_dim": 0.4905749559402466, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.9921875, "step": 489 }, { "epoch": 0.46934865900383144, "grad_norm": 18.007051467895508, "learning_rate": 3.9736842105263165e-06, "loss": 0.9597, "step": 490 }, { "epoch": 0.46934865900383144, "loss_full_dim": 0.3997504711151123, "loss_main": 0.8201595544815063, "loss_parscale": 0.8125, "loss_sub_dim": 0.42040905356407166, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.984375, "step": 490 }, { "epoch": 0.4703065134099617, "grad_norm": 6.527791976928711, "learning_rate": 3.971052631578948e-06, "loss": 0.8202, "step": 491 }, { "epoch": 0.4703065134099617, "loss_full_dim": 0.4439392387866974, "loss_main": 0.9062317609786987, "loss_parscale": 0.9140625, "loss_sub_dim": 0.46229249238967896, "loss_vclub": 0.000637054443359375, "parscale_sim": 0.98828125, "step": 491 }, { "epoch": 0.47126436781609193, "grad_norm": 7.109913349151611, "learning_rate": 3.968421052631579e-06, "loss": 0.9062, "step": 492 }, { "epoch": 0.47126436781609193, "loss_full_dim": 0.3920830190181732, "loss_main": 0.8015706539154053, "loss_parscale": 0.796875, "loss_sub_dim": 0.40948766469955444, "loss_vclub": 0.000637054443359375, "parscale_sim": 0.9921875, "step": 492 }, { "epoch": 0.4722222222222222, "grad_norm": 11.786262512207031, "learning_rate": 3.965789473684211e-06, "loss": 0.8016, "step": 493 }, { "epoch": 0.4722222222222222, "loss_full_dim": 0.5078076720237732, "loss_main": 1.0408761501312256, "loss_parscale": 1.046875, "loss_sub_dim": 0.5330685377120972, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.9609375, "step": 493 }, { "epoch": 0.4731800766283525, "grad_norm": 15.11909008026123, "learning_rate": 3.963157894736843e-06, "loss": 1.0409, "step": 494 }, { "epoch": 0.4731800766283525, "loss_full_dim": 0.4381040334701538, "loss_main": 0.9001926779747009, "loss_parscale": 0.9375, "loss_sub_dim": 0.4620886445045471, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.984375, "step": 494 }, { "epoch": 0.47413793103448276, "grad_norm": 8.526082992553711, "learning_rate": 3.960526315789474e-06, "loss": 0.9002, "step": 495 }, { "epoch": 0.47413793103448276, "loss_full_dim": 0.4737030267715454, "loss_main": 0.9695696830749512, "loss_parscale": 0.98046875, "loss_sub_dim": 0.49586665630340576, "loss_vclub": 0.000591278076171875, "parscale_sim": 0.98828125, "step": 495 }, { "epoch": 0.47509578544061304, "grad_norm": 8.647832870483398, "learning_rate": 3.957894736842106e-06, "loss": 0.9696, "step": 496 }, { "epoch": 0.47509578544061304, "loss_full_dim": 0.40522778034210205, "loss_main": 0.8319472074508667, "loss_parscale": 0.828125, "loss_sub_dim": 0.42671942710876465, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98828125, "step": 496 }, { "epoch": 0.4760536398467433, "grad_norm": 8.32548713684082, "learning_rate": 3.955263157894737e-06, "loss": 0.8319, "step": 497 }, { "epoch": 0.4760536398467433, "loss_full_dim": 0.4003702998161316, "loss_main": 0.8200864791870117, "loss_parscale": 0.82421875, "loss_sub_dim": 0.41971614956855774, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.98828125, "step": 497 }, { "epoch": 0.47701149425287354, "grad_norm": 10.860148429870605, "learning_rate": 3.952631578947368e-06, "loss": 0.8201, "step": 498 }, { "epoch": 0.47701149425287354, "loss_full_dim": 0.388689249753952, "loss_main": 0.7957452535629272, "loss_parscale": 0.7890625, "loss_sub_dim": 0.4070560336112976, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.984375, "step": 498 }, { "epoch": 0.4779693486590038, "grad_norm": 8.925423622131348, "learning_rate": 3.95e-06, "loss": 0.7957, "step": 499 }, { "epoch": 0.4779693486590038, "loss_full_dim": 0.37991398572921753, "loss_main": 0.7755700349807739, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3956560492515564, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98828125, "step": 499 }, { "epoch": 0.4789272030651341, "grad_norm": 7.318690299987793, "learning_rate": 3.947368421052632e-06, "loss": 0.7756, "step": 500 }, { "epoch": 0.4789272030651341, "loss_full_dim": 0.3979489803314209, "loss_main": 0.8158926963806152, "loss_parscale": 0.8125, "loss_sub_dim": 0.41794371604919434, "loss_vclub": 0.000598907470703125, "parscale_sim": 0.9921875, "step": 500 }, { "epoch": 0.47988505747126436, "grad_norm": 6.421666622161865, "learning_rate": 3.9447368421052635e-06, "loss": 0.8159, "step": 501 }, { "epoch": 0.47988505747126436, "loss_full_dim": 0.346463680267334, "loss_main": 0.7125113606452942, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3660476803779602, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.98828125, "step": 501 }, { "epoch": 0.48084291187739464, "grad_norm": 9.621811866760254, "learning_rate": 3.942105263157895e-06, "loss": 0.7125, "step": 502 }, { "epoch": 0.48084291187739464, "loss_full_dim": 0.449296236038208, "loss_main": 0.9192360639572144, "loss_parscale": 0.9140625, "loss_sub_dim": 0.46993982791900635, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.984375, "step": 502 }, { "epoch": 0.4818007662835249, "grad_norm": 22.965505599975586, "learning_rate": 3.939473684210527e-06, "loss": 0.9192, "step": 503 }, { "epoch": 0.4818007662835249, "loss_full_dim": 0.4547256827354431, "loss_main": 0.9330440759658813, "loss_parscale": 0.9140625, "loss_sub_dim": 0.47831839323043823, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.95703125, "step": 503 }, { "epoch": 0.4827586206896552, "grad_norm": 23.591094970703125, "learning_rate": 3.936842105263159e-06, "loss": 0.933, "step": 504 }, { "epoch": 0.4827586206896552, "loss_full_dim": 0.35399141907691956, "loss_main": 0.7266026735305786, "loss_parscale": 0.71875, "loss_sub_dim": 0.37261122465133667, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 504 }, { "epoch": 0.4837164750957854, "grad_norm": 7.96452522277832, "learning_rate": 3.93421052631579e-06, "loss": 0.7266, "step": 505 }, { "epoch": 0.4837164750957854, "loss_full_dim": 0.35939326882362366, "loss_main": 0.7361675500869751, "loss_parscale": 0.75, "loss_sub_dim": 0.37677425146102905, "loss_vclub": 0.00058746337890625, "parscale_sim": 0.98828125, "step": 505 }, { "epoch": 0.4846743295019157, "grad_norm": 7.959946155548096, "learning_rate": 3.931578947368421e-06, "loss": 0.7362, "step": 506 }, { "epoch": 0.4846743295019157, "loss_full_dim": 0.42820680141448975, "loss_main": 0.8765750527381897, "loss_parscale": 0.8828125, "loss_sub_dim": 0.44836825132369995, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.9609375, "step": 506 }, { "epoch": 0.48563218390804597, "grad_norm": 19.0102596282959, "learning_rate": 3.928947368421053e-06, "loss": 0.8766, "step": 507 }, { "epoch": 0.48563218390804597, "loss_full_dim": 0.37232130765914917, "loss_main": 0.7643032073974609, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39198189973831177, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.984375, "step": 507 }, { "epoch": 0.48659003831417624, "grad_norm": 29.501436233520508, "learning_rate": 3.926315789473685e-06, "loss": 0.7643, "step": 508 }, { "epoch": 0.48659003831417624, "loss_full_dim": 0.41394883394241333, "loss_main": 0.851944088935852, "loss_parscale": 0.859375, "loss_sub_dim": 0.43799522519111633, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.984375, "step": 508 }, { "epoch": 0.4875478927203065, "grad_norm": 8.266843795776367, "learning_rate": 3.923684210526316e-06, "loss": 0.8519, "step": 509 }, { "epoch": 0.4875478927203065, "loss_full_dim": 0.4628659188747406, "loss_main": 0.9449567794799805, "loss_parscale": 0.9453125, "loss_sub_dim": 0.48209089040756226, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.98828125, "step": 509 }, { "epoch": 0.4885057471264368, "grad_norm": 9.001152038574219, "learning_rate": 3.921052631578947e-06, "loss": 0.945, "step": 510 }, { "epoch": 0.4885057471264368, "loss_full_dim": 0.4470524787902832, "loss_main": 0.9146796464920044, "loss_parscale": 0.9140625, "loss_sub_dim": 0.4676271677017212, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 510 }, { "epoch": 0.48946360153256707, "grad_norm": 28.911087036132812, "learning_rate": 3.918421052631579e-06, "loss": 0.9147, "step": 511 }, { "epoch": 0.48946360153256707, "loss_full_dim": 0.3535180389881134, "loss_main": 0.7254082560539246, "loss_parscale": 0.734375, "loss_sub_dim": 0.37189021706581116, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98828125, "step": 511 }, { "epoch": 0.4904214559386973, "grad_norm": 9.468965530395508, "learning_rate": 3.9157894736842104e-06, "loss": 0.7254, "step": 512 }, { "epoch": 0.4904214559386973, "loss_full_dim": 0.42339709401130676, "loss_main": 0.8646519780158997, "loss_parscale": 0.88671875, "loss_sub_dim": 0.4412548840045929, "loss_vclub": 0.000598907470703125, "parscale_sim": 0.9921875, "step": 512 }, { "epoch": 0.49137931034482757, "grad_norm": 8.307242393493652, "learning_rate": 3.9131578947368424e-06, "loss": 0.8647, "step": 513 }, { "epoch": 0.49137931034482757, "loss_full_dim": 0.4220987856388092, "loss_main": 0.8611315488815308, "loss_parscale": 0.8671875, "loss_sub_dim": 0.43903273344039917, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.984375, "step": 513 }, { "epoch": 0.49233716475095785, "grad_norm": 17.671873092651367, "learning_rate": 3.9105263157894744e-06, "loss": 0.8611, "step": 514 }, { "epoch": 0.49233716475095785, "loss_full_dim": 0.4462484121322632, "loss_main": 0.9117576479911804, "loss_parscale": 0.8984375, "loss_sub_dim": 0.46550923585891724, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98828125, "step": 514 }, { "epoch": 0.4932950191570881, "grad_norm": 8.169134140014648, "learning_rate": 3.907894736842106e-06, "loss": 0.9118, "step": 515 }, { "epoch": 0.4932950191570881, "loss_full_dim": 0.3707517385482788, "loss_main": 0.7592668533325195, "loss_parscale": 0.765625, "loss_sub_dim": 0.38851508498191833, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.9921875, "step": 515 }, { "epoch": 0.4942528735632184, "grad_norm": 5.225532531738281, "learning_rate": 3.905263157894737e-06, "loss": 0.7593, "step": 516 }, { "epoch": 0.4942528735632184, "loss_full_dim": 0.40030211210250854, "loss_main": 0.8230563998222351, "loss_parscale": 0.828125, "loss_sub_dim": 0.42275428771972656, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 516 }, { "epoch": 0.4952107279693487, "grad_norm": 6.497913837432861, "learning_rate": 3.902631578947369e-06, "loss": 0.8231, "step": 517 }, { "epoch": 0.4952107279693487, "loss_full_dim": 0.3780896067619324, "loss_main": 0.7744900584220886, "loss_parscale": 0.78125, "loss_sub_dim": 0.39640045166015625, "loss_vclub": 0.000701904296875, "parscale_sim": 0.98828125, "step": 517 }, { "epoch": 0.49616858237547895, "grad_norm": 22.71976089477539, "learning_rate": 3.900000000000001e-06, "loss": 0.7745, "step": 518 }, { "epoch": 0.49616858237547895, "loss_full_dim": 0.3502586781978607, "loss_main": 0.7167520523071289, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3664934039115906, "loss_vclub": 0.000701904296875, "parscale_sim": 0.98828125, "step": 518 }, { "epoch": 0.49712643678160917, "grad_norm": 8.293785095214844, "learning_rate": 3.897368421052632e-06, "loss": 0.7168, "step": 519 }, { "epoch": 0.49712643678160917, "loss_full_dim": 0.31231072545051575, "loss_main": 0.6399657726287842, "loss_parscale": 0.640625, "loss_sub_dim": 0.3276550769805908, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.98828125, "step": 519 }, { "epoch": 0.49808429118773945, "grad_norm": 6.954294681549072, "learning_rate": 3.894736842105263e-06, "loss": 0.64, "step": 520 }, { "epoch": 0.49808429118773945, "loss_full_dim": 0.34570854902267456, "loss_main": 0.711129903793335, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3654213547706604, "loss_vclub": 0.000518798828125, "parscale_sim": 0.98828125, "step": 520 }, { "epoch": 0.4990421455938697, "grad_norm": 6.206664562225342, "learning_rate": 3.892105263157895e-06, "loss": 0.7111, "step": 521 }, { "epoch": 0.4990421455938697, "loss_full_dim": 0.402418315410614, "loss_main": 0.8236343264579773, "loss_parscale": 0.828125, "loss_sub_dim": 0.4212160110473633, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 521 }, { "epoch": 0.5, "grad_norm": 7.893470764160156, "learning_rate": 3.889473684210527e-06, "loss": 0.8236, "step": 522 }, { "epoch": 0.5, "loss_full_dim": 0.399609237909317, "loss_main": 0.817932665348053, "loss_parscale": 0.82421875, "loss_sub_dim": 0.41832342743873596, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.9921875, "step": 522 }, { "epoch": 0.5009578544061303, "grad_norm": 7.561025142669678, "learning_rate": 3.886842105263158e-06, "loss": 0.8179, "step": 523 }, { "epoch": 0.5009578544061303, "loss_full_dim": 0.34468957781791687, "loss_main": 0.7067384719848633, "loss_parscale": 0.71875, "loss_sub_dim": 0.3620489239692688, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.98828125, "step": 523 }, { "epoch": 0.5019157088122606, "grad_norm": 7.02824068069458, "learning_rate": 3.884210526315789e-06, "loss": 0.7067, "step": 524 }, { "epoch": 0.5019157088122606, "loss_full_dim": 0.43968355655670166, "loss_main": 0.8963159918785095, "loss_parscale": 0.90625, "loss_sub_dim": 0.45663243532180786, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98828125, "step": 524 }, { "epoch": 0.5028735632183908, "grad_norm": 11.62259292602539, "learning_rate": 3.8815789473684214e-06, "loss": 0.8963, "step": 525 }, { "epoch": 0.5028735632183908, "loss_full_dim": 0.3869653642177582, "loss_main": 0.7913620471954346, "loss_parscale": 0.79296875, "loss_sub_dim": 0.404396653175354, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.9921875, "step": 525 }, { "epoch": 0.5038314176245211, "grad_norm": 7.521389961242676, "learning_rate": 3.878947368421053e-06, "loss": 0.7914, "step": 526 }, { "epoch": 0.5038314176245211, "loss_full_dim": 0.394290953874588, "loss_main": 0.8092786073684692, "loss_parscale": 0.8125, "loss_sub_dim": 0.41498762369155884, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98828125, "step": 526 }, { "epoch": 0.5047892720306514, "grad_norm": 7.2915425300598145, "learning_rate": 3.876315789473685e-06, "loss": 0.8093, "step": 527 }, { "epoch": 0.5047892720306514, "loss_full_dim": 0.3782840967178345, "loss_main": 0.7737714648246765, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39548736810684204, "loss_vclub": 0.0006103515625, "parscale_sim": 0.98828125, "step": 527 }, { "epoch": 0.5057471264367817, "grad_norm": 7.985857963562012, "learning_rate": 3.873684210526316e-06, "loss": 0.7738, "step": 528 }, { "epoch": 0.5057471264367817, "loss_full_dim": 0.4281919598579407, "loss_main": 0.8750128746032715, "loss_parscale": 0.890625, "loss_sub_dim": 0.4468208849430084, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.98828125, "step": 528 }, { "epoch": 0.5067049808429118, "grad_norm": 15.993897438049316, "learning_rate": 3.871052631578948e-06, "loss": 0.875, "step": 529 }, { "epoch": 0.5067049808429118, "loss_full_dim": 0.4345497786998749, "loss_main": 0.8865488767623901, "loss_parscale": 0.8671875, "loss_sub_dim": 0.45199906826019287, "loss_vclub": 0.000640869140625, "parscale_sim": 0.98828125, "step": 529 }, { "epoch": 0.5076628352490421, "grad_norm": 25.865110397338867, "learning_rate": 3.868421052631579e-06, "loss": 0.8865, "step": 530 }, { "epoch": 0.5076628352490421, "loss_full_dim": 0.3849673867225647, "loss_main": 0.7937564253807068, "loss_parscale": 0.796875, "loss_sub_dim": 0.4087890386581421, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.984375, "step": 530 }, { "epoch": 0.5086206896551724, "grad_norm": 8.55898380279541, "learning_rate": 3.865789473684211e-06, "loss": 0.7938, "step": 531 }, { "epoch": 0.5086206896551724, "loss_full_dim": 0.32983601093292236, "loss_main": 0.6763049364089966, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34646889567375183, "loss_vclub": 0.000965118408203125, "parscale_sim": 0.98828125, "step": 531 }, { "epoch": 0.5095785440613027, "grad_norm": 6.3029985427856445, "learning_rate": 3.863157894736843e-06, "loss": 0.6763, "step": 532 }, { "epoch": 0.5095785440613027, "loss_full_dim": 0.3382895886898041, "loss_main": 0.6932010650634766, "loss_parscale": 0.703125, "loss_sub_dim": 0.3549115061759949, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.9921875, "step": 532 }, { "epoch": 0.5105363984674329, "grad_norm": 9.82427978515625, "learning_rate": 3.860526315789474e-06, "loss": 0.6932, "step": 533 }, { "epoch": 0.5105363984674329, "loss_full_dim": 0.4559482932090759, "loss_main": 0.9329140186309814, "loss_parscale": 0.9296875, "loss_sub_dim": 0.47696569561958313, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.9921875, "step": 533 }, { "epoch": 0.5114942528735632, "grad_norm": 10.924256324768066, "learning_rate": 3.857894736842105e-06, "loss": 0.9329, "step": 534 }, { "epoch": 0.5114942528735632, "loss_full_dim": 0.34798938035964966, "loss_main": 0.7140880227088928, "loss_parscale": 0.71875, "loss_sub_dim": 0.36609864234924316, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.98828125, "step": 534 }, { "epoch": 0.5124521072796935, "grad_norm": 27.449085235595703, "learning_rate": 3.855263157894737e-06, "loss": 0.7141, "step": 535 }, { "epoch": 0.5124521072796935, "loss_full_dim": 0.3609989583492279, "loss_main": 0.7414600849151611, "loss_parscale": 0.7421875, "loss_sub_dim": 0.38046109676361084, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.96484375, "step": 535 }, { "epoch": 0.5134099616858238, "grad_norm": 8.578968048095703, "learning_rate": 3.852631578947369e-06, "loss": 0.7415, "step": 536 }, { "epoch": 0.5134099616858238, "loss_full_dim": 0.40508008003234863, "loss_main": 0.8284769654273987, "loss_parscale": 0.8359375, "loss_sub_dim": 0.42339688539505005, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98046875, "step": 536 }, { "epoch": 0.514367816091954, "grad_norm": 12.602062225341797, "learning_rate": 3.85e-06, "loss": 0.8285, "step": 537 }, { "epoch": 0.514367816091954, "loss_full_dim": 0.45507603883743286, "loss_main": 0.9321366548538208, "loss_parscale": 0.9296875, "loss_sub_dim": 0.47706061601638794, "loss_vclub": 0.000518798828125, "parscale_sim": 0.984375, "step": 537 }, { "epoch": 0.5153256704980843, "grad_norm": 12.534911155700684, "learning_rate": 3.8473684210526316e-06, "loss": 0.9321, "step": 538 }, { "epoch": 0.5153256704980843, "loss_full_dim": 0.4158463478088379, "loss_main": 0.8481594324111938, "loss_parscale": 0.84375, "loss_sub_dim": 0.43231308460235596, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.9921875, "step": 538 }, { "epoch": 0.5162835249042146, "grad_norm": 9.097540855407715, "learning_rate": 3.8447368421052636e-06, "loss": 0.8482, "step": 539 }, { "epoch": 0.5162835249042146, "loss_full_dim": 0.4309921860694885, "loss_main": 0.8802577257156372, "loss_parscale": 0.875, "loss_sub_dim": 0.4492655098438263, "loss_vclub": 0.000766754150390625, "parscale_sim": 0.98828125, "step": 539 }, { "epoch": 0.5172413793103449, "grad_norm": 8.744942665100098, "learning_rate": 3.842105263157895e-06, "loss": 0.8803, "step": 540 }, { "epoch": 0.5172413793103449, "loss_full_dim": 0.4171324670314789, "loss_main": 0.8528269529342651, "loss_parscale": 0.8515625, "loss_sub_dim": 0.43569451570510864, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.9921875, "step": 540 }, { "epoch": 0.5181992337164751, "grad_norm": 14.316610336303711, "learning_rate": 3.839473684210527e-06, "loss": 0.8528, "step": 541 }, { "epoch": 0.5181992337164751, "loss_full_dim": 0.39955490827560425, "loss_main": 0.8180549144744873, "loss_parscale": 0.8359375, "loss_sub_dim": 0.41849997639656067, "loss_vclub": 0.000701904296875, "parscale_sim": 0.98828125, "step": 541 }, { "epoch": 0.5191570881226054, "grad_norm": 7.526773929595947, "learning_rate": 3.836842105263158e-06, "loss": 0.8181, "step": 542 }, { "epoch": 0.5191570881226054, "loss_full_dim": 0.4557441473007202, "loss_main": 0.9307689666748047, "loss_parscale": 0.9296875, "loss_sub_dim": 0.4750248193740845, "loss_vclub": 0.000766754150390625, "parscale_sim": 0.98828125, "step": 542 }, { "epoch": 0.5201149425287356, "grad_norm": 7.335948467254639, "learning_rate": 3.83421052631579e-06, "loss": 0.9308, "step": 543 }, { "epoch": 0.5201149425287356, "loss_full_dim": 0.4336649775505066, "loss_main": 0.8884449601173401, "loss_parscale": 0.890625, "loss_sub_dim": 0.4547799825668335, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.98828125, "step": 543 }, { "epoch": 0.5210727969348659, "grad_norm": 23.843278884887695, "learning_rate": 3.831578947368421e-06, "loss": 0.8884, "step": 544 }, { "epoch": 0.5210727969348659, "loss_full_dim": 0.37871453166007996, "loss_main": 0.7757532596588135, "loss_parscale": 0.78125, "loss_sub_dim": 0.39703869819641113, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 544 }, { "epoch": 0.5220306513409961, "grad_norm": 7.522928714752197, "learning_rate": 3.828947368421053e-06, "loss": 0.7758, "step": 545 }, { "epoch": 0.5220306513409961, "loss_full_dim": 0.39133530855178833, "loss_main": 0.8014429211616516, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4101076126098633, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.984375, "step": 545 }, { "epoch": 0.5229885057471264, "grad_norm": 8.575542449951172, "learning_rate": 3.826315789473685e-06, "loss": 0.8014, "step": 546 }, { "epoch": 0.5229885057471264, "loss_full_dim": 0.44172534346580505, "loss_main": 0.9027389883995056, "loss_parscale": 0.9140625, "loss_sub_dim": 0.46101364493370056, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.9921875, "step": 546 }, { "epoch": 0.5239463601532567, "grad_norm": 39.4542121887207, "learning_rate": 3.823684210526316e-06, "loss": 0.9027, "step": 547 }, { "epoch": 0.5239463601532567, "loss_full_dim": 0.4176591634750366, "loss_main": 0.8543119430541992, "loss_parscale": 0.84375, "loss_sub_dim": 0.4366527497768402, "loss_vclub": 0.000568389892578125, "parscale_sim": 0.984375, "step": 547 }, { "epoch": 0.524904214559387, "grad_norm": 8.457560539245605, "learning_rate": 3.821052631578947e-06, "loss": 0.8543, "step": 548 }, { "epoch": 0.524904214559387, "loss_full_dim": 0.36087682843208313, "loss_main": 0.7410938739776611, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3802170157432556, "loss_vclub": 0.000736236572265625, "parscale_sim": 0.984375, "step": 548 }, { "epoch": 0.5258620689655172, "grad_norm": 9.917919158935547, "learning_rate": 3.818421052631579e-06, "loss": 0.7411, "step": 549 }, { "epoch": 0.5258620689655172, "loss_full_dim": 0.40151193737983704, "loss_main": 0.8205918073654175, "loss_parscale": 0.8046875, "loss_sub_dim": 0.41907989978790283, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.984375, "step": 549 }, { "epoch": 0.5268199233716475, "grad_norm": 7.599835395812988, "learning_rate": 3.815789473684211e-06, "loss": 0.8206, "step": 550 }, { "epoch": 0.5268199233716475, "loss_full_dim": 0.40666165947914124, "loss_main": 0.8309805393218994, "loss_parscale": 0.8359375, "loss_sub_dim": 0.42431890964508057, "loss_vclub": 0.000732421875, "parscale_sim": 0.98828125, "step": 550 }, { "epoch": 0.5277777777777778, "grad_norm": 18.9655704498291, "learning_rate": 3.8131578947368426e-06, "loss": 0.831, "step": 551 }, { "epoch": 0.5277777777777778, "loss_full_dim": 0.40934693813323975, "loss_main": 0.8357685804367065, "loss_parscale": 0.8359375, "loss_sub_dim": 0.4264216423034668, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.9921875, "step": 551 }, { "epoch": 0.5287356321839081, "grad_norm": 34.5404052734375, "learning_rate": 3.810526315789474e-06, "loss": 0.8358, "step": 552 }, { "epoch": 0.5287356321839081, "loss_full_dim": 0.39442357420921326, "loss_main": 0.8072995543479919, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4128759801387787, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.9921875, "step": 552 }, { "epoch": 0.5296934865900383, "grad_norm": 10.381874084472656, "learning_rate": 3.8078947368421053e-06, "loss": 0.8073, "step": 553 }, { "epoch": 0.5296934865900383, "loss_full_dim": 0.3933138847351074, "loss_main": 0.8040543794631958, "loss_parscale": 0.80078125, "loss_sub_dim": 0.410740464925766, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98828125, "step": 553 }, { "epoch": 0.5306513409961686, "grad_norm": 7.8008599281311035, "learning_rate": 3.805263157894737e-06, "loss": 0.8041, "step": 554 }, { "epoch": 0.5306513409961686, "loss_full_dim": 0.3883284628391266, "loss_main": 0.79366135597229, "loss_parscale": 0.8046875, "loss_sub_dim": 0.40533292293548584, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 554 }, { "epoch": 0.5316091954022989, "grad_norm": 6.636882305145264, "learning_rate": 3.802631578947369e-06, "loss": 0.7937, "step": 555 }, { "epoch": 0.5316091954022989, "loss_full_dim": 0.4291366636753082, "loss_main": 0.8784884214401245, "loss_parscale": 0.87109375, "loss_sub_dim": 0.4493517279624939, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.984375, "step": 555 }, { "epoch": 0.5325670498084292, "grad_norm": 8.213311195373535, "learning_rate": 3.8000000000000005e-06, "loss": 0.8785, "step": 556 }, { "epoch": 0.5325670498084292, "loss_full_dim": 0.41236650943756104, "loss_main": 0.8441540002822876, "loss_parscale": 0.8515625, "loss_sub_dim": 0.43178749084472656, "loss_vclub": 0.00055694580078125, "parscale_sim": 0.98046875, "step": 556 }, { "epoch": 0.5335249042145593, "grad_norm": 9.235682487487793, "learning_rate": 3.7973684210526316e-06, "loss": 0.8442, "step": 557 }, { "epoch": 0.5335249042145593, "loss_full_dim": 0.37766847014427185, "loss_main": 0.7757677435874939, "loss_parscale": 0.78125, "loss_sub_dim": 0.39809927344322205, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 557 }, { "epoch": 0.5344827586206896, "grad_norm": 13.613242149353027, "learning_rate": 3.794736842105263e-06, "loss": 0.7758, "step": 558 }, { "epoch": 0.5344827586206896, "loss_full_dim": 0.4792823791503906, "loss_main": 0.9757659435272217, "loss_parscale": 0.98046875, "loss_sub_dim": 0.49648353457450867, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.98828125, "step": 558 }, { "epoch": 0.5354406130268199, "grad_norm": 8.348362922668457, "learning_rate": 3.792105263157895e-06, "loss": 0.9758, "step": 559 }, { "epoch": 0.5354406130268199, "loss_full_dim": 0.3747255802154541, "loss_main": 0.7671205401420593, "loss_parscale": 0.765625, "loss_sub_dim": 0.3923949599266052, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.984375, "step": 559 }, { "epoch": 0.5363984674329502, "grad_norm": 5.3998942375183105, "learning_rate": 3.789473684210527e-06, "loss": 0.7671, "step": 560 }, { "epoch": 0.5363984674329502, "loss_full_dim": 0.40849336981773376, "loss_main": 0.8347959518432617, "loss_parscale": 0.84765625, "loss_sub_dim": 0.42630261182785034, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 560 }, { "epoch": 0.5373563218390804, "grad_norm": 8.87212085723877, "learning_rate": 3.7868421052631584e-06, "loss": 0.8348, "step": 561 }, { "epoch": 0.5373563218390804, "loss_full_dim": 0.3677901327610016, "loss_main": 0.7523661851882935, "loss_parscale": 0.75390625, "loss_sub_dim": 0.38457605242729187, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.98828125, "step": 561 }, { "epoch": 0.5383141762452107, "grad_norm": 9.449320793151855, "learning_rate": 3.7842105263157895e-06, "loss": 0.7524, "step": 562 }, { "epoch": 0.5383141762452107, "loss_full_dim": 0.4186570644378662, "loss_main": 0.8569782972335815, "loss_parscale": 0.859375, "loss_sub_dim": 0.43832123279571533, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 562 }, { "epoch": 0.539272030651341, "grad_norm": 22.423803329467773, "learning_rate": 3.781578947368421e-06, "loss": 0.857, "step": 563 }, { "epoch": 0.539272030651341, "loss_full_dim": 0.3792080283164978, "loss_main": 0.7757553458213806, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3965473175048828, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.98046875, "step": 563 }, { "epoch": 0.5402298850574713, "grad_norm": 9.004425048828125, "learning_rate": 3.778947368421053e-06, "loss": 0.7758, "step": 564 }, { "epoch": 0.5402298850574713, "loss_full_dim": 0.41585773229599, "loss_main": 0.8508691191673279, "loss_parscale": 0.8515625, "loss_sub_dim": 0.4350113868713379, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.9921875, "step": 564 }, { "epoch": 0.5411877394636015, "grad_norm": 63.230567932128906, "learning_rate": 3.7763157894736847e-06, "loss": 0.8509, "step": 565 }, { "epoch": 0.5411877394636015, "loss_full_dim": 0.37272149324417114, "loss_main": 0.7641438245773315, "loss_parscale": 0.78515625, "loss_sub_dim": 0.3914223313331604, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.96875, "step": 565 }, { "epoch": 0.5421455938697318, "grad_norm": 7.089947700500488, "learning_rate": 3.773684210526316e-06, "loss": 0.7641, "step": 566 }, { "epoch": 0.5421455938697318, "loss_full_dim": 0.3977949321269989, "loss_main": 0.8121960163116455, "loss_parscale": 0.8125, "loss_sub_dim": 0.4144010543823242, "loss_vclub": 0.000732421875, "parscale_sim": 0.984375, "step": 566 }, { "epoch": 0.5431034482758621, "grad_norm": 13.527660369873047, "learning_rate": 3.7710526315789474e-06, "loss": 0.8122, "step": 567 }, { "epoch": 0.5431034482758621, "loss_full_dim": 0.4162103235721588, "loss_main": 0.8498023748397827, "loss_parscale": 0.859375, "loss_sub_dim": 0.4335920512676239, "loss_vclub": 0.000579833984375, "parscale_sim": 0.984375, "step": 567 }, { "epoch": 0.5440613026819924, "grad_norm": 9.530391693115234, "learning_rate": 3.768421052631579e-06, "loss": 0.8498, "step": 568 }, { "epoch": 0.5440613026819924, "loss_full_dim": 0.3596530556678772, "loss_main": 0.7352114915847778, "loss_parscale": 0.75, "loss_sub_dim": 0.37555843591690063, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98828125, "step": 568 }, { "epoch": 0.5450191570881227, "grad_norm": 6.972066879272461, "learning_rate": 3.765789473684211e-06, "loss": 0.7352, "step": 569 }, { "epoch": 0.5450191570881227, "loss_full_dim": 0.3571784198284149, "loss_main": 0.7284547686576843, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3712763488292694, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98828125, "step": 569 }, { "epoch": 0.5459770114942529, "grad_norm": 27.7495059967041, "learning_rate": 3.7631578947368426e-06, "loss": 0.7285, "step": 570 }, { "epoch": 0.5459770114942529, "loss_full_dim": 0.3318771421909332, "loss_main": 0.6830415725708008, "loss_parscale": 0.69921875, "loss_sub_dim": 0.35116440057754517, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98828125, "step": 570 }, { "epoch": 0.5469348659003831, "grad_norm": 9.757909774780273, "learning_rate": 3.7605263157894738e-06, "loss": 0.683, "step": 571 }, { "epoch": 0.5469348659003831, "loss_full_dim": 0.4132184088230133, "loss_main": 0.8453859090805054, "loss_parscale": 0.84375, "loss_sub_dim": 0.43216753005981445, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98828125, "step": 571 }, { "epoch": 0.5478927203065134, "grad_norm": 9.703629493713379, "learning_rate": 3.7578947368421053e-06, "loss": 0.8454, "step": 572 }, { "epoch": 0.5478927203065134, "loss_full_dim": 0.40355828404426575, "loss_main": 0.8254421353340149, "loss_parscale": 0.828125, "loss_sub_dim": 0.42188385128974915, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.9921875, "step": 572 }, { "epoch": 0.5488505747126436, "grad_norm": 10.033215522766113, "learning_rate": 3.7552631578947374e-06, "loss": 0.8254, "step": 573 }, { "epoch": 0.5488505747126436, "loss_full_dim": 0.34988707304000854, "loss_main": 0.7191184759140015, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3692314326763153, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.984375, "step": 573 }, { "epoch": 0.5498084291187739, "grad_norm": 11.12651252746582, "learning_rate": 3.752631578947369e-06, "loss": 0.7191, "step": 574 }, { "epoch": 0.5498084291187739, "loss_full_dim": 0.36394232511520386, "loss_main": 0.7451034188270569, "loss_parscale": 0.75, "loss_sub_dim": 0.381161093711853, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 574 }, { "epoch": 0.5507662835249042, "grad_norm": 10.34914779663086, "learning_rate": 3.7500000000000005e-06, "loss": 0.7451, "step": 575 }, { "epoch": 0.5507662835249042, "loss_full_dim": 0.39223572611808777, "loss_main": 0.8020796775817871, "loss_parscale": 0.8046875, "loss_sub_dim": 0.40984398126602173, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 575 }, { "epoch": 0.5517241379310345, "grad_norm": 6.4401702880859375, "learning_rate": 3.7473684210526317e-06, "loss": 0.8021, "step": 576 }, { "epoch": 0.5517241379310345, "loss_full_dim": 0.34866905212402344, "loss_main": 0.7149879932403564, "loss_parscale": 0.7109375, "loss_sub_dim": 0.366318941116333, "loss_vclub": 0.000701904296875, "parscale_sim": 0.98828125, "step": 576 }, { "epoch": 0.5526819923371648, "grad_norm": 11.051721572875977, "learning_rate": 3.7447368421052633e-06, "loss": 0.715, "step": 577 }, { "epoch": 0.5526819923371648, "loss_full_dim": 0.40539753437042236, "loss_main": 0.8267444968223572, "loss_parscale": 0.828125, "loss_sub_dim": 0.4213469624519348, "loss_vclub": 0.000701904296875, "parscale_sim": 0.984375, "step": 577 }, { "epoch": 0.553639846743295, "grad_norm": 20.721498489379883, "learning_rate": 3.7421052631578953e-06, "loss": 0.8267, "step": 578 }, { "epoch": 0.553639846743295, "loss_full_dim": 0.38613930344581604, "loss_main": 0.7936503887176514, "loss_parscale": 0.796875, "loss_sub_dim": 0.4075111150741577, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.9921875, "step": 578 }, { "epoch": 0.5545977011494253, "grad_norm": 6.572969436645508, "learning_rate": 3.739473684210527e-06, "loss": 0.7937, "step": 579 }, { "epoch": 0.5545977011494253, "loss_full_dim": 0.385853111743927, "loss_main": 0.791790246963501, "loss_parscale": 0.77734375, "loss_sub_dim": 0.405937135219574, "loss_vclub": 0.00079345703125, "parscale_sim": 0.98828125, "step": 579 }, { "epoch": 0.5555555555555556, "grad_norm": 8.319478988647461, "learning_rate": 3.736842105263158e-06, "loss": 0.7918, "step": 580 }, { "epoch": 0.5555555555555556, "loss_full_dim": 0.3736950755119324, "loss_main": 0.7650361657142639, "loss_parscale": 0.76171875, "loss_sub_dim": 0.39134109020233154, "loss_vclub": 0.000766754150390625, "parscale_sim": 0.98828125, "step": 580 }, { "epoch": 0.5565134099616859, "grad_norm": 8.994922637939453, "learning_rate": 3.7342105263157896e-06, "loss": 0.765, "step": 581 }, { "epoch": 0.5565134099616859, "loss_full_dim": 0.41554054617881775, "loss_main": 0.851252555847168, "loss_parscale": 0.8515625, "loss_sub_dim": 0.4357120394706726, "loss_vclub": 0.000690460205078125, "parscale_sim": 0.984375, "step": 581 }, { "epoch": 0.5574712643678161, "grad_norm": 8.277159690856934, "learning_rate": 3.7315789473684216e-06, "loss": 0.8513, "step": 582 }, { "epoch": 0.5574712643678161, "loss_full_dim": 0.35676977038383484, "loss_main": 0.7296978235244751, "loss_parscale": 0.7578125, "loss_sub_dim": 0.37292802333831787, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 582 }, { "epoch": 0.5584291187739464, "grad_norm": 100.07181549072266, "learning_rate": 3.728947368421053e-06, "loss": 0.7297, "step": 583 }, { "epoch": 0.5584291187739464, "loss_full_dim": 0.32836490869522095, "loss_main": 0.6741928458213806, "loss_parscale": 0.671875, "loss_sub_dim": 0.34582793712615967, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98828125, "step": 583 }, { "epoch": 0.5593869731800766, "grad_norm": 8.64867115020752, "learning_rate": 3.7263157894736848e-06, "loss": 0.6742, "step": 584 }, { "epoch": 0.5593869731800766, "loss_full_dim": 0.3769546151161194, "loss_main": 0.77303147315979, "loss_parscale": 0.78515625, "loss_sub_dim": 0.39607682824134827, "loss_vclub": 0.000896453857421875, "parscale_sim": 0.9609375, "step": 584 }, { "epoch": 0.5603448275862069, "grad_norm": 14.763797760009766, "learning_rate": 3.723684210526316e-06, "loss": 0.773, "step": 585 }, { "epoch": 0.5603448275862069, "loss_full_dim": 0.3641854226589203, "loss_main": 0.7458138465881348, "loss_parscale": 0.75, "loss_sub_dim": 0.3816283941268921, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 585 }, { "epoch": 0.5613026819923371, "grad_norm": 12.483150482177734, "learning_rate": 3.7210526315789475e-06, "loss": 0.7458, "step": 586 }, { "epoch": 0.5613026819923371, "loss_full_dim": 0.3767903745174408, "loss_main": 0.7736446857452393, "loss_parscale": 0.765625, "loss_sub_dim": 0.39685434103012085, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.98046875, "step": 586 }, { "epoch": 0.5622605363984674, "grad_norm": 5.412718296051025, "learning_rate": 3.7184210526315795e-06, "loss": 0.7736, "step": 587 }, { "epoch": 0.5622605363984674, "loss_full_dim": 0.3921200633049011, "loss_main": 0.8040615320205688, "loss_parscale": 0.7890625, "loss_sub_dim": 0.4119414687156677, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.9765625, "step": 587 }, { "epoch": 0.5632183908045977, "grad_norm": 8.084800720214844, "learning_rate": 3.715789473684211e-06, "loss": 0.8041, "step": 588 }, { "epoch": 0.5632183908045977, "loss_full_dim": 0.42770445346832275, "loss_main": 0.8762289881706238, "loss_parscale": 0.8828125, "loss_sub_dim": 0.448524534702301, "loss_vclub": 0.000732421875, "parscale_sim": 0.98828125, "step": 588 }, { "epoch": 0.564176245210728, "grad_norm": 11.244412422180176, "learning_rate": 3.7131578947368422e-06, "loss": 0.8762, "step": 589 }, { "epoch": 0.564176245210728, "loss_full_dim": 0.30496731400489807, "loss_main": 0.6236667037010193, "loss_parscale": 0.62109375, "loss_sub_dim": 0.3186993896961212, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 589 }, { "epoch": 0.5651340996168582, "grad_norm": 11.547786712646484, "learning_rate": 3.710526315789474e-06, "loss": 0.6237, "step": 590 }, { "epoch": 0.5651340996168582, "loss_full_dim": 0.4197801649570465, "loss_main": 0.8576474189758301, "loss_parscale": 0.85546875, "loss_sub_dim": 0.4378672242164612, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.984375, "step": 590 }, { "epoch": 0.5660919540229885, "grad_norm": 20.094385147094727, "learning_rate": 3.7078947368421054e-06, "loss": 0.8576, "step": 591 }, { "epoch": 0.5660919540229885, "loss_full_dim": 0.3988147974014282, "loss_main": 0.8149283528327942, "loss_parscale": 0.8203125, "loss_sub_dim": 0.41611355543136597, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98828125, "step": 591 }, { "epoch": 0.5670498084291188, "grad_norm": 8.58596420288086, "learning_rate": 3.7052631578947374e-06, "loss": 0.8149, "step": 592 }, { "epoch": 0.5670498084291188, "loss_full_dim": 0.39256641268730164, "loss_main": 0.8020637631416321, "loss_parscale": 0.8046875, "loss_sub_dim": 0.40949735045433044, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98828125, "step": 592 }, { "epoch": 0.5680076628352491, "grad_norm": 8.805715560913086, "learning_rate": 3.702631578947369e-06, "loss": 0.8021, "step": 593 }, { "epoch": 0.5680076628352491, "loss_full_dim": 0.39340120553970337, "loss_main": 0.8021652698516846, "loss_parscale": 0.8125, "loss_sub_dim": 0.4087640345096588, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 593 }, { "epoch": 0.5689655172413793, "grad_norm": 8.338133811950684, "learning_rate": 3.7e-06, "loss": 0.8022, "step": 594 }, { "epoch": 0.5689655172413793, "loss_full_dim": 0.3676563501358032, "loss_main": 0.7523549199104309, "loss_parscale": 0.7578125, "loss_sub_dim": 0.3846985697746277, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.96875, "step": 594 }, { "epoch": 0.5699233716475096, "grad_norm": 6.730896472930908, "learning_rate": 3.6973684210526317e-06, "loss": 0.7524, "step": 595 }, { "epoch": 0.5699233716475096, "loss_full_dim": 0.4061720073223114, "loss_main": 0.8314781188964844, "loss_parscale": 0.8359375, "loss_sub_dim": 0.42530614137649536, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.984375, "step": 595 }, { "epoch": 0.5708812260536399, "grad_norm": 6.777297496795654, "learning_rate": 3.6947368421052637e-06, "loss": 0.8315, "step": 596 }, { "epoch": 0.5708812260536399, "loss_full_dim": 0.3343586027622223, "loss_main": 0.6856595277786255, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3513009548187256, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.98828125, "step": 596 }, { "epoch": 0.5718390804597702, "grad_norm": 7.930263996124268, "learning_rate": 3.6921052631578953e-06, "loss": 0.6857, "step": 597 }, { "epoch": 0.5718390804597702, "loss_full_dim": 0.3635607063770294, "loss_main": 0.7422827482223511, "loss_parscale": 0.74609375, "loss_sub_dim": 0.37872201204299927, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98828125, "step": 597 }, { "epoch": 0.5727969348659003, "grad_norm": 6.821435928344727, "learning_rate": 3.6894736842105265e-06, "loss": 0.7423, "step": 598 }, { "epoch": 0.5727969348659003, "loss_full_dim": 0.3355541527271271, "loss_main": 0.6876914501190186, "loss_parscale": 0.6875, "loss_sub_dim": 0.35213732719421387, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.984375, "step": 598 }, { "epoch": 0.5737547892720306, "grad_norm": 7.392444133758545, "learning_rate": 3.686842105263158e-06, "loss": 0.6877, "step": 599 }, { "epoch": 0.5737547892720306, "loss_full_dim": 0.413994699716568, "loss_main": 0.8455986380577087, "loss_parscale": 0.84375, "loss_sub_dim": 0.43160393834114075, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.98828125, "step": 599 }, { "epoch": 0.5747126436781609, "grad_norm": 9.861312866210938, "learning_rate": 3.6842105263157896e-06, "loss": 0.8456, "step": 600 }, { "epoch": 0.5747126436781609, "loss_full_dim": 0.42901960015296936, "loss_main": 0.8774645328521729, "loss_parscale": 0.890625, "loss_sub_dim": 0.4484449625015259, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 600 }, { "epoch": 0.5756704980842912, "grad_norm": 9.708776473999023, "learning_rate": 3.6815789473684216e-06, "loss": 0.8775, "step": 601 }, { "epoch": 0.5756704980842912, "loss_full_dim": 0.49078428745269775, "loss_main": 1.0028836727142334, "loss_parscale": 1.0, "loss_sub_dim": 0.5120993852615356, "loss_vclub": 0.00079345703125, "parscale_sim": 0.98828125, "step": 601 }, { "epoch": 0.5766283524904214, "grad_norm": 8.76320743560791, "learning_rate": 3.6789473684210532e-06, "loss": 1.0029, "step": 602 }, { "epoch": 0.5766283524904214, "loss_full_dim": 0.4062999486923218, "loss_main": 0.8297877311706543, "loss_parscale": 0.82421875, "loss_sub_dim": 0.4234877824783325, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98828125, "step": 602 }, { "epoch": 0.5775862068965517, "grad_norm": 16.673053741455078, "learning_rate": 3.6763157894736844e-06, "loss": 0.8298, "step": 603 }, { "epoch": 0.5775862068965517, "loss_full_dim": 0.38452693819999695, "loss_main": 0.7864630222320557, "loss_parscale": 0.7890625, "loss_sub_dim": 0.40193605422973633, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 603 }, { "epoch": 0.578544061302682, "grad_norm": 8.208160400390625, "learning_rate": 3.673684210526316e-06, "loss": 0.7865, "step": 604 }, { "epoch": 0.578544061302682, "loss_full_dim": 0.40884289145469666, "loss_main": 0.8330626487731934, "loss_parscale": 0.828125, "loss_sub_dim": 0.4242197573184967, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.98046875, "step": 604 }, { "epoch": 0.5795019157088123, "grad_norm": 11.186745643615723, "learning_rate": 3.6710526315789476e-06, "loss": 0.8331, "step": 605 }, { "epoch": 0.5795019157088123, "loss_full_dim": 0.3858218789100647, "loss_main": 0.7898447513580322, "loss_parscale": 0.80859375, "loss_sub_dim": 0.40402287244796753, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.98828125, "step": 605 }, { "epoch": 0.5804597701149425, "grad_norm": 5.610227584838867, "learning_rate": 3.6684210526315796e-06, "loss": 0.7898, "step": 606 }, { "epoch": 0.5804597701149425, "loss_full_dim": 0.3668707311153412, "loss_main": 0.750206708908081, "loss_parscale": 0.75390625, "loss_sub_dim": 0.38333597779273987, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 606 }, { "epoch": 0.5814176245210728, "grad_norm": 7.061725616455078, "learning_rate": 3.6657894736842107e-06, "loss": 0.7502, "step": 607 }, { "epoch": 0.5814176245210728, "loss_full_dim": 0.35448116064071655, "loss_main": 0.7236437797546387, "loss_parscale": 0.73046875, "loss_sub_dim": 0.3691626191139221, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98046875, "step": 607 }, { "epoch": 0.5823754789272031, "grad_norm": 7.050046920776367, "learning_rate": 3.6631578947368423e-06, "loss": 0.7236, "step": 608 }, { "epoch": 0.5823754789272031, "loss_full_dim": 0.3727227449417114, "loss_main": 0.7636138200759888, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39089107513427734, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.98828125, "step": 608 }, { "epoch": 0.5833333333333334, "grad_norm": 18.700233459472656, "learning_rate": 3.660526315789474e-06, "loss": 0.7636, "step": 609 }, { "epoch": 0.5833333333333334, "loss_full_dim": 0.43339747190475464, "loss_main": 0.8818596005439758, "loss_parscale": 0.88671875, "loss_sub_dim": 0.4484621286392212, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.98828125, "step": 609 }, { "epoch": 0.5842911877394636, "grad_norm": 9.195364952087402, "learning_rate": 3.657894736842106e-06, "loss": 0.8819, "step": 610 }, { "epoch": 0.5842911877394636, "loss_full_dim": 0.3755834400653839, "loss_main": 0.7676678895950317, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3920844793319702, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 610 }, { "epoch": 0.5852490421455939, "grad_norm": 7.468223571777344, "learning_rate": 3.6552631578947375e-06, "loss": 0.7677, "step": 611 }, { "epoch": 0.5852490421455939, "loss_full_dim": 0.3605292737483978, "loss_main": 0.7394759654998779, "loss_parscale": 0.7421875, "loss_sub_dim": 0.3789466619491577, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.984375, "step": 611 }, { "epoch": 0.5862068965517241, "grad_norm": 5.607725143432617, "learning_rate": 3.6526315789473686e-06, "loss": 0.7395, "step": 612 }, { "epoch": 0.5862068965517241, "loss_full_dim": 0.38043212890625, "loss_main": 0.7754331827163696, "loss_parscale": 0.78125, "loss_sub_dim": 0.39500105381011963, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.9765625, "step": 612 }, { "epoch": 0.5871647509578544, "grad_norm": 7.648861885070801, "learning_rate": 3.65e-06, "loss": 0.7754, "step": 613 }, { "epoch": 0.5871647509578544, "loss_full_dim": 0.33986616134643555, "loss_main": 0.6965060234069824, "loss_parscale": 0.703125, "loss_sub_dim": 0.3566398620605469, "loss_vclub": 0.000823974609375, "parscale_sim": 0.984375, "step": 613 }, { "epoch": 0.5881226053639846, "grad_norm": 8.064492225646973, "learning_rate": 3.6473684210526318e-06, "loss": 0.6965, "step": 614 }, { "epoch": 0.5881226053639846, "loss_full_dim": 0.36061498522758484, "loss_main": 0.7377320528030396, "loss_parscale": 0.73828125, "loss_sub_dim": 0.3771170973777771, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.98828125, "step": 614 }, { "epoch": 0.5890804597701149, "grad_norm": 7.867294788360596, "learning_rate": 3.644736842105264e-06, "loss": 0.7377, "step": 615 }, { "epoch": 0.5890804597701149, "loss_full_dim": 0.37691423296928406, "loss_main": 0.7694753408432007, "loss_parscale": 0.76953125, "loss_sub_dim": 0.392561137676239, "loss_vclub": 0.000598907470703125, "parscale_sim": 0.98828125, "step": 615 }, { "epoch": 0.5900383141762452, "grad_norm": 6.5483717918396, "learning_rate": 3.642105263157895e-06, "loss": 0.7695, "step": 616 }, { "epoch": 0.5900383141762452, "loss_full_dim": 0.4145055115222931, "loss_main": 0.8457109928131104, "loss_parscale": 0.8515625, "loss_sub_dim": 0.4312054514884949, "loss_vclub": 0.0006103515625, "parscale_sim": 0.98828125, "step": 616 }, { "epoch": 0.5909961685823755, "grad_norm": 6.012157440185547, "learning_rate": 3.6394736842105265e-06, "loss": 0.8457, "step": 617 }, { "epoch": 0.5909961685823755, "loss_full_dim": 0.4019372761249542, "loss_main": 0.819922685623169, "loss_parscale": 0.828125, "loss_sub_dim": 0.41798537969589233, "loss_vclub": 0.000652313232421875, "parscale_sim": 0.98828125, "step": 617 }, { "epoch": 0.5919540229885057, "grad_norm": 8.520037651062012, "learning_rate": 3.636842105263158e-06, "loss": 0.8199, "step": 618 }, { "epoch": 0.5919540229885057, "loss_full_dim": 0.34308940172195435, "loss_main": 0.701278805732727, "loss_parscale": 0.71484375, "loss_sub_dim": 0.3581894040107727, "loss_vclub": 0.000774383544921875, "parscale_sim": 0.98828125, "step": 618 }, { "epoch": 0.592911877394636, "grad_norm": 9.239031791687012, "learning_rate": 3.6342105263157897e-06, "loss": 0.7013, "step": 619 }, { "epoch": 0.592911877394636, "loss_full_dim": 0.3045141100883484, "loss_main": 0.6224718689918518, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3179577589035034, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.98828125, "step": 619 }, { "epoch": 0.5938697318007663, "grad_norm": 8.798670768737793, "learning_rate": 3.6315789473684217e-06, "loss": 0.6225, "step": 620 }, { "epoch": 0.5938697318007663, "loss_full_dim": 0.37874355912208557, "loss_main": 0.777694821357727, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3989512324333191, "loss_vclub": 0.000774383544921875, "parscale_sim": 0.98828125, "step": 620 }, { "epoch": 0.5948275862068966, "grad_norm": 6.577239513397217, "learning_rate": 3.628947368421053e-06, "loss": 0.7777, "step": 621 }, { "epoch": 0.5948275862068966, "loss_full_dim": 0.35175567865371704, "loss_main": 0.7197355031967163, "loss_parscale": 0.734375, "loss_sub_dim": 0.3679797947406769, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.98828125, "step": 621 }, { "epoch": 0.5957854406130269, "grad_norm": 8.303664207458496, "learning_rate": 3.6263157894736844e-06, "loss": 0.7197, "step": 622 }, { "epoch": 0.5957854406130269, "loss_full_dim": 0.43367141485214233, "loss_main": 0.8843362927436829, "loss_parscale": 0.890625, "loss_sub_dim": 0.4506648778915405, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.98046875, "step": 622 }, { "epoch": 0.5967432950191571, "grad_norm": 8.651481628417969, "learning_rate": 3.623684210526316e-06, "loss": 0.8843, "step": 623 }, { "epoch": 0.5967432950191571, "loss_full_dim": 0.35451072454452515, "loss_main": 0.7273985743522644, "loss_parscale": 0.7265625, "loss_sub_dim": 0.37288784980773926, "loss_vclub": 0.00055694580078125, "parscale_sim": 0.984375, "step": 623 }, { "epoch": 0.5977011494252874, "grad_norm": 6.098386287689209, "learning_rate": 3.621052631578948e-06, "loss": 0.7274, "step": 624 }, { "epoch": 0.5977011494252874, "loss_full_dim": 0.3830614686012268, "loss_main": 0.7811719179153442, "loss_parscale": 0.78125, "loss_sub_dim": 0.39811044931411743, "loss_vclub": 0.000701904296875, "parscale_sim": 0.9921875, "step": 624 }, { "epoch": 0.5986590038314177, "grad_norm": 5.2734880447387695, "learning_rate": 3.618421052631579e-06, "loss": 0.7812, "step": 625 }, { "epoch": 0.5986590038314177, "loss_full_dim": 0.3895306885242462, "loss_main": 0.7965936660766602, "loss_parscale": 0.796875, "loss_sub_dim": 0.40706300735473633, "loss_vclub": 0.000629425048828125, "parscale_sim": 0.98828125, "step": 625 }, { "epoch": 0.5996168582375478, "grad_norm": 9.12495231628418, "learning_rate": 3.6157894736842108e-06, "loss": 0.7966, "step": 626 }, { "epoch": 0.5996168582375478, "loss_full_dim": 0.3625415563583374, "loss_main": 0.7448047399520874, "loss_parscale": 0.7421875, "loss_sub_dim": 0.38226318359375, "loss_vclub": 0.000823974609375, "parscale_sim": 0.9921875, "step": 626 }, { "epoch": 0.6005747126436781, "grad_norm": 7.7561774253845215, "learning_rate": 3.6131578947368424e-06, "loss": 0.7448, "step": 627 }, { "epoch": 0.6005747126436781, "loss_full_dim": 0.30775636434555054, "loss_main": 0.6316295862197876, "loss_parscale": 0.6328125, "loss_sub_dim": 0.32387325167655945, "loss_vclub": 0.00079345703125, "parscale_sim": 0.98828125, "step": 627 }, { "epoch": 0.6015325670498084, "grad_norm": 6.016205787658691, "learning_rate": 3.610526315789474e-06, "loss": 0.6316, "step": 628 }, { "epoch": 0.6015325670498084, "loss_full_dim": 0.37608057260513306, "loss_main": 0.769316554069519, "loss_parscale": 0.765625, "loss_sub_dim": 0.393235981464386, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98828125, "step": 628 }, { "epoch": 0.6024904214559387, "grad_norm": 6.769039154052734, "learning_rate": 3.607894736842106e-06, "loss": 0.7693, "step": 629 }, { "epoch": 0.6024904214559387, "loss_full_dim": 0.3264373242855072, "loss_main": 0.670752763748169, "loss_parscale": 0.671875, "loss_sub_dim": 0.34431546926498413, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.98828125, "step": 629 }, { "epoch": 0.603448275862069, "grad_norm": 8.537970542907715, "learning_rate": 3.605263157894737e-06, "loss": 0.6708, "step": 630 }, { "epoch": 0.603448275862069, "loss_full_dim": 0.35444653034210205, "loss_main": 0.7283558249473572, "loss_parscale": 0.71875, "loss_sub_dim": 0.3739092946052551, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.98828125, "step": 630 }, { "epoch": 0.6044061302681992, "grad_norm": 9.72378921508789, "learning_rate": 3.6026315789473687e-06, "loss": 0.7284, "step": 631 }, { "epoch": 0.6044061302681992, "loss_full_dim": 0.3693956434726715, "loss_main": 0.7541300654411316, "loss_parscale": 0.7578125, "loss_sub_dim": 0.3847344219684601, "loss_vclub": 0.000640869140625, "parscale_sim": 0.984375, "step": 631 }, { "epoch": 0.6053639846743295, "grad_norm": 6.915194511413574, "learning_rate": 3.6000000000000003e-06, "loss": 0.7541, "step": 632 }, { "epoch": 0.6053639846743295, "loss_full_dim": 0.34886547923088074, "loss_main": 0.7151840925216675, "loss_parscale": 0.7109375, "loss_sub_dim": 0.36631861329078674, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98828125, "step": 632 }, { "epoch": 0.6063218390804598, "grad_norm": 12.071630477905273, "learning_rate": 3.5973684210526314e-06, "loss": 0.7152, "step": 633 }, { "epoch": 0.6063218390804598, "loss_full_dim": 0.377309113740921, "loss_main": 0.7689975500106812, "loss_parscale": 0.78125, "loss_sub_dim": 0.39168840646743774, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.98828125, "step": 633 }, { "epoch": 0.60727969348659, "grad_norm": 7.716428756713867, "learning_rate": 3.5947368421052634e-06, "loss": 0.769, "step": 634 }, { "epoch": 0.60727969348659, "loss_full_dim": 0.38069093227386475, "loss_main": 0.7775954008102417, "loss_parscale": 0.78125, "loss_sub_dim": 0.39690449833869934, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.984375, "step": 634 }, { "epoch": 0.6082375478927203, "grad_norm": 8.86046028137207, "learning_rate": 3.592105263157895e-06, "loss": 0.7776, "step": 635 }, { "epoch": 0.6082375478927203, "loss_full_dim": 0.44749921560287476, "loss_main": 0.9123023748397827, "loss_parscale": 0.921875, "loss_sub_dim": 0.46480318903923035, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.984375, "step": 635 }, { "epoch": 0.6091954022988506, "grad_norm": 8.167008399963379, "learning_rate": 3.5894736842105266e-06, "loss": 0.9123, "step": 636 }, { "epoch": 0.6091954022988506, "loss_full_dim": 0.3738894760608673, "loss_main": 0.7667446136474609, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39285510778427124, "loss_vclub": 0.000583648681640625, "parscale_sim": 0.984375, "step": 636 }, { "epoch": 0.6101532567049809, "grad_norm": 9.643288612365723, "learning_rate": 3.586842105263158e-06, "loss": 0.7667, "step": 637 }, { "epoch": 0.6101532567049809, "loss_full_dim": 0.3674898147583008, "loss_main": 0.7544536590576172, "loss_parscale": 0.7578125, "loss_sub_dim": 0.3869638442993164, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.98828125, "step": 637 }, { "epoch": 0.6111111111111112, "grad_norm": 11.781011581420898, "learning_rate": 3.58421052631579e-06, "loss": 0.7545, "step": 638 }, { "epoch": 0.6111111111111112, "loss_full_dim": 0.42799466848373413, "loss_main": 0.8748005032539368, "loss_parscale": 0.8828125, "loss_sub_dim": 0.44680583477020264, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.9765625, "step": 638 }, { "epoch": 0.6120689655172413, "grad_norm": 47.356781005859375, "learning_rate": 3.5815789473684213e-06, "loss": 0.8748, "step": 639 }, { "epoch": 0.6120689655172413, "loss_full_dim": 0.37664031982421875, "loss_main": 0.7700567245483398, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3934163749217987, "loss_vclub": 0.000621795654296875, "parscale_sim": 0.98828125, "step": 639 }, { "epoch": 0.6130268199233716, "grad_norm": 5.0274977684021, "learning_rate": 3.578947368421053e-06, "loss": 0.7701, "step": 640 }, { "epoch": 0.6130268199233716, "loss_full_dim": 0.3306906819343567, "loss_main": 0.6803011894226074, "loss_parscale": 0.68359375, "loss_sub_dim": 0.34961050748825073, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.984375, "step": 640 }, { "epoch": 0.6139846743295019, "grad_norm": 7.3341169357299805, "learning_rate": 3.5763157894736845e-06, "loss": 0.6803, "step": 641 }, { "epoch": 0.6139846743295019, "loss_full_dim": 0.38578546047210693, "loss_main": 0.7877669930458069, "loss_parscale": 0.7890625, "loss_sub_dim": 0.40198153257369995, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98828125, "step": 641 }, { "epoch": 0.6149425287356322, "grad_norm": 10.04371166229248, "learning_rate": 3.5736842105263157e-06, "loss": 0.7878, "step": 642 }, { "epoch": 0.6149425287356322, "loss_full_dim": 0.40235623717308044, "loss_main": 0.8239575624465942, "loss_parscale": 0.828125, "loss_sub_dim": 0.4216012954711914, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 642 }, { "epoch": 0.6159003831417624, "grad_norm": 737.8432006835938, "learning_rate": 3.571052631578948e-06, "loss": 0.824, "step": 643 }, { "epoch": 0.6159003831417624, "loss_full_dim": 0.37617796659469604, "loss_main": 0.7678096890449524, "loss_parscale": 0.765625, "loss_sub_dim": 0.39163172245025635, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.984375, "step": 643 }, { "epoch": 0.6168582375478927, "grad_norm": 9.844654083251953, "learning_rate": 3.5684210526315792e-06, "loss": 0.7678, "step": 644 }, { "epoch": 0.6168582375478927, "loss_full_dim": 0.46482017636299133, "loss_main": 0.9480472803115845, "loss_parscale": 0.9765625, "loss_sub_dim": 0.48322707414627075, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 644 }, { "epoch": 0.617816091954023, "grad_norm": 7.224414348602295, "learning_rate": 3.565789473684211e-06, "loss": 0.948, "step": 645 }, { "epoch": 0.617816091954023, "loss_full_dim": 0.4094318449497223, "loss_main": 0.8378751277923584, "loss_parscale": 0.83984375, "loss_sub_dim": 0.4284432530403137, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98828125, "step": 645 }, { "epoch": 0.6187739463601533, "grad_norm": 95.70195770263672, "learning_rate": 3.5631578947368424e-06, "loss": 0.8379, "step": 646 }, { "epoch": 0.6187739463601533, "loss_full_dim": 0.3916766047477722, "loss_main": 0.8044508695602417, "loss_parscale": 0.8125, "loss_sub_dim": 0.4127742350101471, "loss_vclub": 0.000774383544921875, "parscale_sim": 0.98046875, "step": 646 }, { "epoch": 0.6197318007662835, "grad_norm": 8.41223430633545, "learning_rate": 3.5605263157894736e-06, "loss": 0.8045, "step": 647 }, { "epoch": 0.6197318007662835, "loss_full_dim": 0.42553597688674927, "loss_main": 0.8768475651741028, "loss_parscale": 0.875, "loss_sub_dim": 0.4513115882873535, "loss_vclub": 0.00079345703125, "parscale_sim": 0.9609375, "step": 647 }, { "epoch": 0.6206896551724138, "grad_norm": 6.600493907928467, "learning_rate": 3.5578947368421056e-06, "loss": 0.8768, "step": 648 }, { "epoch": 0.6206896551724138, "loss_full_dim": 0.4116237759590149, "loss_main": 0.8431026935577393, "loss_parscale": 0.84375, "loss_sub_dim": 0.43147894740104675, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.98828125, "step": 648 }, { "epoch": 0.6216475095785441, "grad_norm": 80.52225494384766, "learning_rate": 3.555263157894737e-06, "loss": 0.8431, "step": 649 }, { "epoch": 0.6216475095785441, "loss_full_dim": 0.4589002728462219, "loss_main": 0.9359846115112305, "loss_parscale": 0.92578125, "loss_sub_dim": 0.47708433866500854, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.9609375, "step": 649 }, { "epoch": 0.6226053639846744, "grad_norm": 8.910249710083008, "learning_rate": 3.5526315789473687e-06, "loss": 0.936, "step": 650 }, { "epoch": 0.6226053639846744, "loss_full_dim": 0.41864654421806335, "loss_main": 0.8566197156906128, "loss_parscale": 0.8671875, "loss_sub_dim": 0.43797314167022705, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98828125, "step": 650 }, { "epoch": 0.6235632183908046, "grad_norm": 7.23588228225708, "learning_rate": 3.5500000000000003e-06, "loss": 0.8566, "step": 651 }, { "epoch": 0.6235632183908046, "loss_full_dim": 0.4360385835170746, "loss_main": 0.8937052488327026, "loss_parscale": 0.8984375, "loss_sub_dim": 0.45766666531562805, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.9921875, "step": 651 }, { "epoch": 0.6245210727969349, "grad_norm": 6.044622898101807, "learning_rate": 3.5473684210526323e-06, "loss": 0.8937, "step": 652 }, { "epoch": 0.6245210727969349, "loss_full_dim": 0.3791128098964691, "loss_main": 0.7813546657562256, "loss_parscale": 0.77734375, "loss_sub_dim": 0.40224185585975647, "loss_vclub": 0.00091552734375, "parscale_sim": 0.98828125, "step": 652 }, { "epoch": 0.6254789272030651, "grad_norm": 9.055522918701172, "learning_rate": 3.5447368421052635e-06, "loss": 0.7814, "step": 653 }, { "epoch": 0.6254789272030651, "loss_full_dim": 0.38967809081077576, "loss_main": 0.7966306209564209, "loss_parscale": 0.80859375, "loss_sub_dim": 0.40695255994796753, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 653 }, { "epoch": 0.6264367816091954, "grad_norm": 8.26673698425293, "learning_rate": 3.542105263157895e-06, "loss": 0.7966, "step": 654 }, { "epoch": 0.6264367816091954, "loss_full_dim": 0.3654250204563141, "loss_main": 0.7511687278747559, "loss_parscale": 0.74609375, "loss_sub_dim": 0.38574373722076416, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.98828125, "step": 654 }, { "epoch": 0.6273946360153256, "grad_norm": 8.552175521850586, "learning_rate": 3.5394736842105266e-06, "loss": 0.7512, "step": 655 }, { "epoch": 0.6273946360153256, "loss_full_dim": 0.37584373354911804, "loss_main": 0.7734447717666626, "loss_parscale": 0.77734375, "loss_sub_dim": 0.39760103821754456, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 655 }, { "epoch": 0.6283524904214559, "grad_norm": 6.5405097007751465, "learning_rate": 3.536842105263158e-06, "loss": 0.7734, "step": 656 }, { "epoch": 0.6283524904214559, "loss_full_dim": 0.362912118434906, "loss_main": 0.7439122200012207, "loss_parscale": 0.765625, "loss_sub_dim": 0.3810001015663147, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 656 }, { "epoch": 0.6293103448275862, "grad_norm": 7.742701530456543, "learning_rate": 3.53421052631579e-06, "loss": 0.7439, "step": 657 }, { "epoch": 0.6293103448275862, "loss_full_dim": 0.38433676958084106, "loss_main": 0.7854261994361877, "loss_parscale": 0.78125, "loss_sub_dim": 0.4010894298553467, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98828125, "step": 657 }, { "epoch": 0.6302681992337165, "grad_norm": 20.530805587768555, "learning_rate": 3.5315789473684214e-06, "loss": 0.7854, "step": 658 }, { "epoch": 0.6302681992337165, "loss_full_dim": 0.4051019847393036, "loss_main": 0.8268929719924927, "loss_parscale": 0.828125, "loss_sub_dim": 0.4217909574508667, "loss_vclub": 0.0006103515625, "parscale_sim": 0.98828125, "step": 658 }, { "epoch": 0.6312260536398467, "grad_norm": 9.170215606689453, "learning_rate": 3.528947368421053e-06, "loss": 0.8269, "step": 659 }, { "epoch": 0.6312260536398467, "loss_full_dim": 0.32692041993141174, "loss_main": 0.6748608350753784, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3479404151439667, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98828125, "step": 659 }, { "epoch": 0.632183908045977, "grad_norm": 24.804521560668945, "learning_rate": 3.5263157894736846e-06, "loss": 0.6749, "step": 660 }, { "epoch": 0.632183908045977, "loss_full_dim": 0.3500936031341553, "loss_main": 0.716692328453064, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3665987551212311, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.98046875, "step": 660 }, { "epoch": 0.6331417624521073, "grad_norm": 8.422623634338379, "learning_rate": 3.5236842105263157e-06, "loss": 0.7167, "step": 661 }, { "epoch": 0.6331417624521073, "loss_full_dim": 0.4495907127857208, "loss_main": 0.9171713590621948, "loss_parscale": 0.9140625, "loss_sub_dim": 0.4675806164741516, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 661 }, { "epoch": 0.6340996168582376, "grad_norm": 6.829285621643066, "learning_rate": 3.5210526315789477e-06, "loss": 0.9172, "step": 662 }, { "epoch": 0.6340996168582376, "loss_full_dim": 0.38358116149902344, "loss_main": 0.7836158871650696, "loss_parscale": 0.78515625, "loss_sub_dim": 0.40003472566604614, "loss_vclub": 0.00058746337890625, "parscale_sim": 0.984375, "step": 662 }, { "epoch": 0.6350574712643678, "grad_norm": 9.006641387939453, "learning_rate": 3.5184210526315793e-06, "loss": 0.7836, "step": 663 }, { "epoch": 0.6350574712643678, "loss_full_dim": 0.43741998076438904, "loss_main": 0.8953244686126709, "loss_parscale": 0.890625, "loss_sub_dim": 0.45790451765060425, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.96484375, "step": 663 }, { "epoch": 0.6360153256704981, "grad_norm": 6.877085208892822, "learning_rate": 3.515789473684211e-06, "loss": 0.8953, "step": 664 }, { "epoch": 0.6360153256704981, "loss_full_dim": 0.3455687463283539, "loss_main": 0.7086609601974487, "loss_parscale": 0.71875, "loss_sub_dim": 0.36309224367141724, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.984375, "step": 664 }, { "epoch": 0.6369731800766284, "grad_norm": 7.461938381195068, "learning_rate": 3.513157894736842e-06, "loss": 0.7087, "step": 665 }, { "epoch": 0.6369731800766284, "loss_full_dim": 0.41512659192085266, "loss_main": 0.8477782011032104, "loss_parscale": 0.84765625, "loss_sub_dim": 0.4326516091823578, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.9921875, "step": 665 }, { "epoch": 0.6379310344827587, "grad_norm": 6.940959930419922, "learning_rate": 3.510526315789474e-06, "loss": 0.8478, "step": 666 }, { "epoch": 0.6379310344827587, "loss_full_dim": 0.35328617691993713, "loss_main": 0.7246911525726318, "loss_parscale": 0.7421875, "loss_sub_dim": 0.3714050054550171, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98828125, "step": 666 }, { "epoch": 0.6388888888888888, "grad_norm": 12.387791633605957, "learning_rate": 3.5078947368421056e-06, "loss": 0.7247, "step": 667 }, { "epoch": 0.6388888888888888, "loss_full_dim": 0.38207462430000305, "loss_main": 0.7831108570098877, "loss_parscale": 0.7734375, "loss_sub_dim": 0.40103623270988464, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.984375, "step": 667 }, { "epoch": 0.6398467432950191, "grad_norm": 13.372007369995117, "learning_rate": 3.505263157894737e-06, "loss": 0.7831, "step": 668 }, { "epoch": 0.6398467432950191, "loss_full_dim": 0.342801958322525, "loss_main": 0.7007765769958496, "loss_parscale": 0.703125, "loss_sub_dim": 0.357974648475647, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.984375, "step": 668 }, { "epoch": 0.6408045977011494, "grad_norm": 7.884926795959473, "learning_rate": 3.502631578947369e-06, "loss": 0.7008, "step": 669 }, { "epoch": 0.6408045977011494, "loss_full_dim": 0.3415779769420624, "loss_main": 0.7019186019897461, "loss_parscale": 0.71875, "loss_sub_dim": 0.36034059524536133, "loss_vclub": 0.00058746337890625, "parscale_sim": 0.98828125, "step": 669 }, { "epoch": 0.6417624521072797, "grad_norm": 15.414067268371582, "learning_rate": 3.5e-06, "loss": 0.7019, "step": 670 }, { "epoch": 0.6417624521072797, "loss_full_dim": 0.30076295137405396, "loss_main": 0.6195588111877441, "loss_parscale": 0.640625, "loss_sub_dim": 0.3187958598136902, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 670 }, { "epoch": 0.64272030651341, "grad_norm": 12.826836585998535, "learning_rate": 3.497368421052632e-06, "loss": 0.6196, "step": 671 }, { "epoch": 0.64272030651341, "loss_full_dim": 0.3479505777359009, "loss_main": 0.7154622077941895, "loss_parscale": 0.71875, "loss_sub_dim": 0.3675116300582886, "loss_vclub": 0.000885009765625, "parscale_sim": 0.98828125, "step": 671 }, { "epoch": 0.6436781609195402, "grad_norm": 9.429525375366211, "learning_rate": 3.4947368421052635e-06, "loss": 0.7155, "step": 672 }, { "epoch": 0.6436781609195402, "loss_full_dim": 0.39929914474487305, "loss_main": 0.8155978322029114, "loss_parscale": 0.8125, "loss_sub_dim": 0.41629868745803833, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98828125, "step": 672 }, { "epoch": 0.6446360153256705, "grad_norm": 13.930412292480469, "learning_rate": 3.492105263157895e-06, "loss": 0.8156, "step": 673 }, { "epoch": 0.6446360153256705, "loss_full_dim": 0.3861931264400482, "loss_main": 0.7870795726776123, "loss_parscale": 0.80078125, "loss_sub_dim": 0.4008864760398865, "loss_vclub": 0.0005340576171875, "parscale_sim": 0.98828125, "step": 673 }, { "epoch": 0.6455938697318008, "grad_norm": 7.4572882652282715, "learning_rate": 3.4894736842105263e-06, "loss": 0.7871, "step": 674 }, { "epoch": 0.6455938697318008, "loss_full_dim": 0.4106043577194214, "loss_main": 0.8413838744163513, "loss_parscale": 0.83203125, "loss_sub_dim": 0.43077951669692993, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.98828125, "step": 674 }, { "epoch": 0.646551724137931, "grad_norm": 6.58626651763916, "learning_rate": 3.486842105263158e-06, "loss": 0.8414, "step": 675 }, { "epoch": 0.646551724137931, "loss_full_dim": 0.33586838841438293, "loss_main": 0.6885675191879272, "loss_parscale": 0.68359375, "loss_sub_dim": 0.3526991307735443, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 675 }, { "epoch": 0.6475095785440613, "grad_norm": 8.520795822143555, "learning_rate": 3.48421052631579e-06, "loss": 0.6886, "step": 676 }, { "epoch": 0.6475095785440613, "loss_full_dim": 0.3459956645965576, "loss_main": 0.7082948684692383, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3622991740703583, "loss_vclub": 0.000774383544921875, "parscale_sim": 0.984375, "step": 676 }, { "epoch": 0.6484674329501916, "grad_norm": 6.5044331550598145, "learning_rate": 3.4815789473684214e-06, "loss": 0.7083, "step": 677 }, { "epoch": 0.6484674329501916, "loss_full_dim": 0.3320862650871277, "loss_main": 0.6836618185043335, "loss_parscale": 0.69921875, "loss_sub_dim": 0.3515755534172058, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98828125, "step": 677 }, { "epoch": 0.6494252873563219, "grad_norm": 7.972768783569336, "learning_rate": 3.478947368421053e-06, "loss": 0.6837, "step": 678 }, { "epoch": 0.6494252873563219, "loss_full_dim": 0.3367515206336975, "loss_main": 0.688400149345398, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3516486585140228, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.98828125, "step": 678 }, { "epoch": 0.6503831417624522, "grad_norm": 21.9426326751709, "learning_rate": 3.476315789473684e-06, "loss": 0.6884, "step": 679 }, { "epoch": 0.6503831417624522, "loss_full_dim": 0.37176743149757385, "loss_main": 0.7594293355941772, "loss_parscale": 0.7734375, "loss_sub_dim": 0.387661874294281, "loss_vclub": 0.000507354736328125, "parscale_sim": 0.98828125, "step": 679 }, { "epoch": 0.6513409961685823, "grad_norm": 7.565419673919678, "learning_rate": 3.473684210526316e-06, "loss": 0.7594, "step": 680 }, { "epoch": 0.6513409961685823, "loss_full_dim": 0.4062742292881012, "loss_main": 0.8332991600036621, "loss_parscale": 0.82421875, "loss_sub_dim": 0.4270249605178833, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.98046875, "step": 680 }, { "epoch": 0.6522988505747126, "grad_norm": 9.901589393615723, "learning_rate": 3.4710526315789478e-06, "loss": 0.8333, "step": 681 }, { "epoch": 0.6522988505747126, "loss_full_dim": 0.3416685461997986, "loss_main": 0.7004766464233398, "loss_parscale": 0.703125, "loss_sub_dim": 0.35880810022354126, "loss_vclub": 0.000614166259765625, "parscale_sim": 0.984375, "step": 681 }, { "epoch": 0.6532567049808429, "grad_norm": 6.50786828994751, "learning_rate": 3.4684210526315794e-06, "loss": 0.7005, "step": 682 }, { "epoch": 0.6532567049808429, "loss_full_dim": 0.4060927927494049, "loss_main": 0.8290061950683594, "loss_parscale": 0.8203125, "loss_sub_dim": 0.4229133725166321, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.98828125, "step": 682 }, { "epoch": 0.6542145593869731, "grad_norm": 6.8023529052734375, "learning_rate": 3.4657894736842105e-06, "loss": 0.829, "step": 683 }, { "epoch": 0.6542145593869731, "loss_full_dim": 0.36702653765678406, "loss_main": 0.7504749298095703, "loss_parscale": 0.75, "loss_sub_dim": 0.38344839215278625, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.98828125, "step": 683 }, { "epoch": 0.6551724137931034, "grad_norm": 15.033411979675293, "learning_rate": 3.463157894736842e-06, "loss": 0.7505, "step": 684 }, { "epoch": 0.6551724137931034, "loss_full_dim": 0.3140878975391388, "loss_main": 0.6433349847793579, "loss_parscale": 0.65234375, "loss_sub_dim": 0.32924705743789673, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.98828125, "step": 684 }, { "epoch": 0.6561302681992337, "grad_norm": 11.756685256958008, "learning_rate": 3.460526315789474e-06, "loss": 0.6433, "step": 685 }, { "epoch": 0.6561302681992337, "loss_full_dim": 0.34399616718292236, "loss_main": 0.7049688100814819, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3609726130962372, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.96484375, "step": 685 }, { "epoch": 0.657088122605364, "grad_norm": 7.646183967590332, "learning_rate": 3.4578947368421057e-06, "loss": 0.705, "step": 686 }, { "epoch": 0.657088122605364, "loss_full_dim": 0.3898676037788391, "loss_main": 0.7989562749862671, "loss_parscale": 0.8046875, "loss_sub_dim": 0.40908870100975037, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.984375, "step": 686 }, { "epoch": 0.6580459770114943, "grad_norm": 10.833155632019043, "learning_rate": 3.4552631578947373e-06, "loss": 0.799, "step": 687 }, { "epoch": 0.6580459770114943, "loss_full_dim": 0.36072075366973877, "loss_main": 0.7377711534500122, "loss_parscale": 0.74609375, "loss_sub_dim": 0.3770504295825958, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98828125, "step": 687 }, { "epoch": 0.6590038314176245, "grad_norm": 8.125412940979004, "learning_rate": 3.4526315789473684e-06, "loss": 0.7378, "step": 688 }, { "epoch": 0.6590038314176245, "loss_full_dim": 0.3586362302303314, "loss_main": 0.7327041625976562, "loss_parscale": 0.734375, "loss_sub_dim": 0.37406790256500244, "loss_vclub": 0.000690460205078125, "parscale_sim": 0.9921875, "step": 688 }, { "epoch": 0.6599616858237548, "grad_norm": 6.585686206817627, "learning_rate": 3.45e-06, "loss": 0.7327, "step": 689 }, { "epoch": 0.6599616858237548, "loss_full_dim": 0.38002997636795044, "loss_main": 0.7761666178703308, "loss_parscale": 0.78125, "loss_sub_dim": 0.39613664150238037, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.98828125, "step": 689 }, { "epoch": 0.6609195402298851, "grad_norm": 6.495802879333496, "learning_rate": 3.447368421052632e-06, "loss": 0.7762, "step": 690 }, { "epoch": 0.6609195402298851, "loss_full_dim": 0.35055986046791077, "loss_main": 0.7161433696746826, "loss_parscale": 0.71875, "loss_sub_dim": 0.36558347940444946, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.984375, "step": 690 }, { "epoch": 0.6618773946360154, "grad_norm": 7.337845802307129, "learning_rate": 3.4447368421052636e-06, "loss": 0.7161, "step": 691 }, { "epoch": 0.6618773946360154, "loss_full_dim": 0.36405330896377563, "loss_main": 0.7454806566238403, "loss_parscale": 0.75, "loss_sub_dim": 0.3814273476600647, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 691 }, { "epoch": 0.6628352490421456, "grad_norm": 12.520709037780762, "learning_rate": 3.4421052631578947e-06, "loss": 0.7455, "step": 692 }, { "epoch": 0.6628352490421456, "loss_full_dim": 0.37593546509742737, "loss_main": 0.7681820392608643, "loss_parscale": 0.76953125, "loss_sub_dim": 0.3922466039657593, "loss_vclub": 0.000823974609375, "parscale_sim": 0.98828125, "step": 692 }, { "epoch": 0.6637931034482759, "grad_norm": 13.093415260314941, "learning_rate": 3.4394736842105263e-06, "loss": 0.7682, "step": 693 }, { "epoch": 0.6637931034482759, "loss_full_dim": 0.4038117825984955, "loss_main": 0.8254109621047974, "loss_parscale": 0.8359375, "loss_sub_dim": 0.42159920930862427, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.984375, "step": 693 }, { "epoch": 0.6647509578544061, "grad_norm": 7.556214809417725, "learning_rate": 3.4368421052631583e-06, "loss": 0.8254, "step": 694 }, { "epoch": 0.6647509578544061, "loss_full_dim": 0.3547059893608093, "loss_main": 0.7252997756004333, "loss_parscale": 0.73828125, "loss_sub_dim": 0.370593786239624, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.96484375, "step": 694 }, { "epoch": 0.6657088122605364, "grad_norm": 15.479902267456055, "learning_rate": 3.43421052631579e-06, "loss": 0.7253, "step": 695 }, { "epoch": 0.6657088122605364, "loss_full_dim": 0.3563348948955536, "loss_main": 0.7303295135498047, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3739945888519287, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.98828125, "step": 695 }, { "epoch": 0.6666666666666666, "grad_norm": 10.095793724060059, "learning_rate": 3.4315789473684215e-06, "loss": 0.7303, "step": 696 }, { "epoch": 0.6666666666666666, "loss_full_dim": 0.3358292281627655, "loss_main": 0.6884044408798218, "loss_parscale": 0.6796875, "loss_sub_dim": 0.35257524251937866, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.98828125, "step": 696 }, { "epoch": 0.6676245210727969, "grad_norm": 5.973373889923096, "learning_rate": 3.4289473684210527e-06, "loss": 0.6884, "step": 697 }, { "epoch": 0.6676245210727969, "loss_full_dim": 0.3747398555278778, "loss_main": 0.7672826051712036, "loss_parscale": 0.765625, "loss_sub_dim": 0.3925427198410034, "loss_vclub": 0.000782012939453125, "parscale_sim": 0.98828125, "step": 697 }, { "epoch": 0.6685823754789272, "grad_norm": 9.625094413757324, "learning_rate": 3.4263157894736842e-06, "loss": 0.7673, "step": 698 }, { "epoch": 0.6685823754789272, "loss_full_dim": 0.361211359500885, "loss_main": 0.7394975423812866, "loss_parscale": 0.7421875, "loss_sub_dim": 0.3782861828804016, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.98828125, "step": 698 }, { "epoch": 0.6695402298850575, "grad_norm": 9.792860984802246, "learning_rate": 3.4236842105263162e-06, "loss": 0.7395, "step": 699 }, { "epoch": 0.6695402298850575, "loss_full_dim": 0.3969326317310333, "loss_main": 0.811667799949646, "loss_parscale": 0.8125, "loss_sub_dim": 0.41473516821861267, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.984375, "step": 699 }, { "epoch": 0.6704980842911877, "grad_norm": 8.506646156311035, "learning_rate": 3.421052631578948e-06, "loss": 0.8117, "step": 700 }, { "epoch": 0.6704980842911877, "loss_full_dim": 0.3781275749206543, "loss_main": 0.7729290723800659, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3948014974594116, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98828125, "step": 700 }, { "epoch": 0.671455938697318, "grad_norm": 10.224783897399902, "learning_rate": 3.418421052631579e-06, "loss": 0.7729, "step": 701 }, { "epoch": 0.671455938697318, "loss_full_dim": 0.331767737865448, "loss_main": 0.6805902123451233, "loss_parscale": 0.6875, "loss_sub_dim": 0.3488224744796753, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.98828125, "step": 701 }, { "epoch": 0.6724137931034483, "grad_norm": 5.3285017013549805, "learning_rate": 3.4157894736842106e-06, "loss": 0.6806, "step": 702 }, { "epoch": 0.6724137931034483, "loss_full_dim": 0.34197166562080383, "loss_main": 0.6990185976028442, "loss_parscale": 0.6875, "loss_sub_dim": 0.357046902179718, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.984375, "step": 702 }, { "epoch": 0.6733716475095786, "grad_norm": 10.266390800476074, "learning_rate": 3.413157894736842e-06, "loss": 0.699, "step": 703 }, { "epoch": 0.6733716475095786, "loss_full_dim": 0.3412066102027893, "loss_main": 0.6991812586784363, "loss_parscale": 0.7109375, "loss_sub_dim": 0.357974648475647, "loss_vclub": 0.000690460205078125, "parscale_sim": 0.984375, "step": 703 }, { "epoch": 0.6743295019157088, "grad_norm": 9.011483192443848, "learning_rate": 3.410526315789474e-06, "loss": 0.6992, "step": 704 }, { "epoch": 0.6743295019157088, "loss_full_dim": 0.3533942699432373, "loss_main": 0.7245076298713684, "loss_parscale": 0.72265625, "loss_sub_dim": 0.3711133599281311, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.98046875, "step": 704 }, { "epoch": 0.6752873563218391, "grad_norm": 7.464562892913818, "learning_rate": 3.4078947368421057e-06, "loss": 0.7245, "step": 705 }, { "epoch": 0.6752873563218391, "loss_full_dim": 0.3651576042175293, "loss_main": 0.7498793005943298, "loss_parscale": 0.7578125, "loss_sub_dim": 0.38472169637680054, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.98828125, "step": 705 }, { "epoch": 0.6762452107279694, "grad_norm": 8.348101615905762, "learning_rate": 3.405263157894737e-06, "loss": 0.7499, "step": 706 }, { "epoch": 0.6762452107279694, "loss_full_dim": 0.378921777009964, "loss_main": 0.7817250490188599, "loss_parscale": 0.7890625, "loss_sub_dim": 0.40280330181121826, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.98828125, "step": 706 }, { "epoch": 0.6772030651340997, "grad_norm": 6.642910957336426, "learning_rate": 3.4026315789473685e-06, "loss": 0.7817, "step": 707 }, { "epoch": 0.6772030651340997, "loss_full_dim": 0.4290948510169983, "loss_main": 0.8743246793746948, "loss_parscale": 0.87890625, "loss_sub_dim": 0.44522982835769653, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.98046875, "step": 707 }, { "epoch": 0.6781609195402298, "grad_norm": 7.717892169952393, "learning_rate": 3.4000000000000005e-06, "loss": 0.8743, "step": 708 }, { "epoch": 0.6781609195402298, "loss_full_dim": 0.3429861068725586, "loss_main": 0.704389214515686, "loss_parscale": 0.7109375, "loss_sub_dim": 0.36140313744544983, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 708 }, { "epoch": 0.6791187739463601, "grad_norm": 6.720066547393799, "learning_rate": 3.397368421052632e-06, "loss": 0.7044, "step": 709 }, { "epoch": 0.6791187739463601, "loss_full_dim": 0.35892102122306824, "loss_main": 0.7389011383056641, "loss_parscale": 0.75, "loss_sub_dim": 0.3799801170825958, "loss_vclub": 0.000640869140625, "parscale_sim": 0.984375, "step": 709 }, { "epoch": 0.6800766283524904, "grad_norm": 10.380602836608887, "learning_rate": 3.3947368421052636e-06, "loss": 0.7389, "step": 710 }, { "epoch": 0.6800766283524904, "loss_full_dim": 0.41322505474090576, "loss_main": 0.8459407687187195, "loss_parscale": 0.84375, "loss_sub_dim": 0.4327157139778137, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 710 }, { "epoch": 0.6810344827586207, "grad_norm": 8.37010669708252, "learning_rate": 3.392105263157895e-06, "loss": 0.8459, "step": 711 }, { "epoch": 0.6810344827586207, "loss_full_dim": 0.35125860571861267, "loss_main": 0.7194243669509888, "loss_parscale": 0.73828125, "loss_sub_dim": 0.3681657612323761, "loss_vclub": 0.000732421875, "parscale_sim": 0.98828125, "step": 711 }, { "epoch": 0.6819923371647509, "grad_norm": 7.7574334144592285, "learning_rate": 3.3894736842105264e-06, "loss": 0.7194, "step": 712 }, { "epoch": 0.6819923371647509, "loss_full_dim": 0.4200282692909241, "loss_main": 0.8603829145431519, "loss_parscale": 0.875, "loss_sub_dim": 0.4403546452522278, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.9921875, "step": 712 }, { "epoch": 0.6829501915708812, "grad_norm": 10.606945991516113, "learning_rate": 3.3868421052631584e-06, "loss": 0.8604, "step": 713 }, { "epoch": 0.6829501915708812, "loss_full_dim": 0.35591912269592285, "loss_main": 0.7311740517616272, "loss_parscale": 0.72265625, "loss_sub_dim": 0.37525492906570435, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98828125, "step": 713 }, { "epoch": 0.6839080459770115, "grad_norm": 8.318496704101562, "learning_rate": 3.38421052631579e-06, "loss": 0.7312, "step": 714 }, { "epoch": 0.6839080459770115, "loss_full_dim": 0.4192562997341156, "loss_main": 0.8564820289611816, "loss_parscale": 0.859375, "loss_sub_dim": 0.4372257590293884, "loss_vclub": 0.000823974609375, "parscale_sim": 0.984375, "step": 714 }, { "epoch": 0.6848659003831418, "grad_norm": 14.334474563598633, "learning_rate": 3.381578947368421e-06, "loss": 0.8565, "step": 715 }, { "epoch": 0.6848659003831418, "loss_full_dim": 0.43208619952201843, "loss_main": 0.8880373239517212, "loss_parscale": 0.89453125, "loss_sub_dim": 0.45595115423202515, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.98046875, "step": 715 }, { "epoch": 0.685823754789272, "grad_norm": 8.7576265335083, "learning_rate": 3.3789473684210527e-06, "loss": 0.888, "step": 716 }, { "epoch": 0.685823754789272, "loss_full_dim": 0.3396463394165039, "loss_main": 0.6985732913017273, "loss_parscale": 0.72265625, "loss_sub_dim": 0.3589269518852234, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 716 }, { "epoch": 0.6867816091954023, "grad_norm": 7.664742469787598, "learning_rate": 3.3763157894736843e-06, "loss": 0.6986, "step": 717 }, { "epoch": 0.6867816091954023, "loss_full_dim": 0.4221315383911133, "loss_main": 0.8694269061088562, "loss_parscale": 0.8828125, "loss_sub_dim": 0.4472953677177429, "loss_vclub": 0.000614166259765625, "parscale_sim": 0.98828125, "step": 717 }, { "epoch": 0.6877394636015326, "grad_norm": 7.91140604019165, "learning_rate": 3.3736842105263163e-06, "loss": 0.8694, "step": 718 }, { "epoch": 0.6877394636015326, "loss_full_dim": 0.40751156210899353, "loss_main": 0.8325203657150269, "loss_parscale": 0.8359375, "loss_sub_dim": 0.42500877380371094, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 718 }, { "epoch": 0.6886973180076629, "grad_norm": 21.66642189025879, "learning_rate": 3.371052631578948e-06, "loss": 0.8325, "step": 719 }, { "epoch": 0.6886973180076629, "loss_full_dim": 0.3858703672885895, "loss_main": 0.7907639741897583, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4048936367034912, "loss_vclub": 0.000881195068359375, "parscale_sim": 0.98828125, "step": 719 }, { "epoch": 0.6896551724137931, "grad_norm": 5.652876377105713, "learning_rate": 3.368421052631579e-06, "loss": 0.7908, "step": 720 }, { "epoch": 0.6896551724137931, "loss_full_dim": 0.400865763425827, "loss_main": 0.8198204040527344, "loss_parscale": 0.8203125, "loss_sub_dim": 0.41895467042922974, "loss_vclub": 0.000652313232421875, "parscale_sim": 0.9765625, "step": 720 }, { "epoch": 0.6906130268199234, "grad_norm": 10.016226768493652, "learning_rate": 3.3657894736842106e-06, "loss": 0.8198, "step": 721 }, { "epoch": 0.6906130268199234, "loss_full_dim": 0.4133625328540802, "loss_main": 0.8424787521362305, "loss_parscale": 0.84375, "loss_sub_dim": 0.42911621928215027, "loss_vclub": 0.0004825592041015625, "parscale_sim": 0.984375, "step": 721 }, { "epoch": 0.6915708812260536, "grad_norm": 20.094451904296875, "learning_rate": 3.3631578947368426e-06, "loss": 0.8425, "step": 722 }, { "epoch": 0.6915708812260536, "loss_full_dim": 0.38048264384269714, "loss_main": 0.7781673073768616, "loss_parscale": 0.78125, "loss_sub_dim": 0.39768466353416443, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.98046875, "step": 722 }, { "epoch": 0.6925287356321839, "grad_norm": 5.5275983810424805, "learning_rate": 3.360526315789474e-06, "loss": 0.7782, "step": 723 }, { "epoch": 0.6925287356321839, "loss_full_dim": 0.46949949860572815, "loss_main": 0.9592869877815247, "loss_parscale": 0.98046875, "loss_sub_dim": 0.4897874891757965, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98828125, "step": 723 }, { "epoch": 0.6934865900383141, "grad_norm": 39.33779525756836, "learning_rate": 3.3578947368421054e-06, "loss": 0.9593, "step": 724 }, { "epoch": 0.6934865900383141, "loss_full_dim": 0.35905104875564575, "loss_main": 0.7364293932914734, "loss_parscale": 0.7421875, "loss_sub_dim": 0.37737834453582764, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.984375, "step": 724 }, { "epoch": 0.6944444444444444, "grad_norm": 7.166776657104492, "learning_rate": 3.355263157894737e-06, "loss": 0.7364, "step": 725 }, { "epoch": 0.6944444444444444, "loss_full_dim": 0.3597618043422699, "loss_main": 0.7391419410705566, "loss_parscale": 0.75, "loss_sub_dim": 0.37938010692596436, "loss_vclub": 0.000782012939453125, "parscale_sim": 0.984375, "step": 725 }, { "epoch": 0.6954022988505747, "grad_norm": 8.375383377075195, "learning_rate": 3.3526315789473685e-06, "loss": 0.7391, "step": 726 }, { "epoch": 0.6954022988505747, "loss_full_dim": 0.4320880174636841, "loss_main": 0.8828896880149841, "loss_parscale": 0.8828125, "loss_sub_dim": 0.45080167055130005, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 726 }, { "epoch": 0.696360153256705, "grad_norm": 8.720915794372559, "learning_rate": 3.3500000000000005e-06, "loss": 0.8829, "step": 727 }, { "epoch": 0.696360153256705, "loss_full_dim": 0.33927181363105774, "loss_main": 0.6968182325363159, "loss_parscale": 0.703125, "loss_sub_dim": 0.3575463891029358, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.984375, "step": 727 }, { "epoch": 0.6973180076628352, "grad_norm": 6.794954299926758, "learning_rate": 3.347368421052632e-06, "loss": 0.6968, "step": 728 }, { "epoch": 0.6973180076628352, "loss_full_dim": 0.42647165060043335, "loss_main": 0.8732032775878906, "loss_parscale": 0.8671875, "loss_sub_dim": 0.4467315971851349, "loss_vclub": 0.0006103515625, "parscale_sim": 0.98828125, "step": 728 }, { "epoch": 0.6982758620689655, "grad_norm": 14.35696029663086, "learning_rate": 3.3447368421052633e-06, "loss": 0.8732, "step": 729 }, { "epoch": 0.6982758620689655, "loss_full_dim": 0.38248008489608765, "loss_main": 0.7839491963386536, "loss_parscale": 0.7890625, "loss_sub_dim": 0.4014691114425659, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 729 }, { "epoch": 0.6992337164750958, "grad_norm": 17.094144821166992, "learning_rate": 3.342105263157895e-06, "loss": 0.7839, "step": 730 }, { "epoch": 0.6992337164750958, "loss_full_dim": 0.357968807220459, "loss_main": 0.7301003932952881, "loss_parscale": 0.7421875, "loss_sub_dim": 0.3721315860748291, "loss_vclub": 0.000881195068359375, "parscale_sim": 0.9921875, "step": 730 }, { "epoch": 0.7001915708812261, "grad_norm": 6.7278852462768555, "learning_rate": 3.3394736842105264e-06, "loss": 0.7301, "step": 731 }, { "epoch": 0.7001915708812261, "loss_full_dim": 0.40725937485694885, "loss_main": 0.8338544368743896, "loss_parscale": 0.8359375, "loss_sub_dim": 0.4265950918197632, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.98046875, "step": 731 }, { "epoch": 0.7011494252873564, "grad_norm": 20.440279006958008, "learning_rate": 3.3368421052631584e-06, "loss": 0.8339, "step": 732 }, { "epoch": 0.7011494252873564, "loss_full_dim": 0.3662302792072296, "loss_main": 0.7509365081787109, "loss_parscale": 0.7734375, "loss_sub_dim": 0.38470619916915894, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98828125, "step": 732 }, { "epoch": 0.7021072796934866, "grad_norm": 8.15213680267334, "learning_rate": 3.3342105263157896e-06, "loss": 0.7509, "step": 733 }, { "epoch": 0.7021072796934866, "loss_full_dim": 0.3307819068431854, "loss_main": 0.6795156002044678, "loss_parscale": 0.6953125, "loss_sub_dim": 0.34873372316360474, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.984375, "step": 733 }, { "epoch": 0.7030651340996169, "grad_norm": 9.682537078857422, "learning_rate": 3.331578947368421e-06, "loss": 0.6795, "step": 734 }, { "epoch": 0.7030651340996169, "loss_full_dim": 0.3883688151836395, "loss_main": 0.7983404994010925, "loss_parscale": 0.8046875, "loss_sub_dim": 0.409971684217453, "loss_vclub": 0.000823974609375, "parscale_sim": 0.984375, "step": 734 }, { "epoch": 0.7040229885057471, "grad_norm": 35.52913284301758, "learning_rate": 3.3289473684210528e-06, "loss": 0.7983, "step": 735 }, { "epoch": 0.7040229885057471, "loss_full_dim": 0.36248794198036194, "loss_main": 0.7441411018371582, "loss_parscale": 0.7578125, "loss_sub_dim": 0.3816531300544739, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 735 }, { "epoch": 0.7049808429118773, "grad_norm": 15.38346004486084, "learning_rate": 3.3263157894736848e-06, "loss": 0.7441, "step": 736 }, { "epoch": 0.7049808429118773, "loss_full_dim": 0.3449156880378723, "loss_main": 0.7100434899330139, "loss_parscale": 0.71484375, "loss_sub_dim": 0.3651278018951416, "loss_vclub": 0.000637054443359375, "parscale_sim": 0.9921875, "step": 736 }, { "epoch": 0.7059386973180076, "grad_norm": 11.406737327575684, "learning_rate": 3.3236842105263164e-06, "loss": 0.71, "step": 737 }, { "epoch": 0.7059386973180076, "loss_full_dim": 0.3990878760814667, "loss_main": 0.8217262625694275, "loss_parscale": 0.828125, "loss_sub_dim": 0.4226383864879608, "loss_vclub": 0.000522613525390625, "parscale_sim": 0.96484375, "step": 737 }, { "epoch": 0.7068965517241379, "grad_norm": 44.84303283691406, "learning_rate": 3.3210526315789475e-06, "loss": 0.8217, "step": 738 }, { "epoch": 0.7068965517241379, "loss_full_dim": 0.4398984909057617, "loss_main": 0.901033878326416, "loss_parscale": 0.8828125, "loss_sub_dim": 0.4611354172229767, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.98046875, "step": 738 }, { "epoch": 0.7078544061302682, "grad_norm": 11.984313011169434, "learning_rate": 3.318421052631579e-06, "loss": 0.901, "step": 739 }, { "epoch": 0.7078544061302682, "loss_full_dim": 0.36098378896713257, "loss_main": 0.7439538240432739, "loss_parscale": 0.74609375, "loss_sub_dim": 0.38297000527381897, "loss_vclub": 0.000762939453125, "parscale_sim": 0.984375, "step": 739 }, { "epoch": 0.7088122605363985, "grad_norm": 11.272483825683594, "learning_rate": 3.3157894736842107e-06, "loss": 0.744, "step": 740 }, { "epoch": 0.7088122605363985, "loss_full_dim": 0.3312142491340637, "loss_main": 0.6809147596359253, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3497004806995392, "loss_vclub": 0.00079345703125, "parscale_sim": 0.98828125, "step": 740 }, { "epoch": 0.7097701149425287, "grad_norm": 8.5563383102417, "learning_rate": 3.3131578947368427e-06, "loss": 0.6809, "step": 741 }, { "epoch": 0.7097701149425287, "loss_full_dim": 0.39221465587615967, "loss_main": 0.8058713674545288, "loss_parscale": 0.79296875, "loss_sub_dim": 0.41365674138069153, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.98828125, "step": 741 }, { "epoch": 0.710727969348659, "grad_norm": 6.927759647369385, "learning_rate": 3.310526315789474e-06, "loss": 0.8059, "step": 742 }, { "epoch": 0.710727969348659, "loss_full_dim": 0.4416637122631073, "loss_main": 0.9041416645050049, "loss_parscale": 0.8984375, "loss_sub_dim": 0.46247798204421997, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.984375, "step": 742 }, { "epoch": 0.7116858237547893, "grad_norm": 6.590476036071777, "learning_rate": 3.3078947368421054e-06, "loss": 0.9041, "step": 743 }, { "epoch": 0.7116858237547893, "loss_full_dim": 0.4099084734916687, "loss_main": 0.8380734324455261, "loss_parscale": 0.82421875, "loss_sub_dim": 0.4281649589538574, "loss_vclub": 0.000762939453125, "parscale_sim": 0.9921875, "step": 743 }, { "epoch": 0.7126436781609196, "grad_norm": 10.020183563232422, "learning_rate": 3.305263157894737e-06, "loss": 0.8381, "step": 744 }, { "epoch": 0.7126436781609196, "loss_full_dim": 0.3845096528530121, "loss_main": 0.7892352342605591, "loss_parscale": 0.78125, "loss_sub_dim": 0.4047255516052246, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.984375, "step": 744 }, { "epoch": 0.7136015325670498, "grad_norm": 6.10109281539917, "learning_rate": 3.302631578947369e-06, "loss": 0.7892, "step": 745 }, { "epoch": 0.7136015325670498, "loss_full_dim": 0.3675553798675537, "loss_main": 0.755120575428009, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3875651955604553, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.98046875, "step": 745 }, { "epoch": 0.7145593869731801, "grad_norm": 7.004367828369141, "learning_rate": 3.3000000000000006e-06, "loss": 0.7551, "step": 746 }, { "epoch": 0.7145593869731801, "loss_full_dim": 0.3819258511066437, "loss_main": 0.7863246202468872, "loss_parscale": 0.7734375, "loss_sub_dim": 0.40439876914024353, "loss_vclub": 0.00052642822265625, "parscale_sim": 0.953125, "step": 746 }, { "epoch": 0.7155172413793104, "grad_norm": 9.161396026611328, "learning_rate": 3.2973684210526318e-06, "loss": 0.7863, "step": 747 }, { "epoch": 0.7155172413793104, "loss_full_dim": 0.36292484402656555, "loss_main": 0.7444798946380615, "loss_parscale": 0.75, "loss_sub_dim": 0.3815550208091736, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.98828125, "step": 747 }, { "epoch": 0.7164750957854407, "grad_norm": 8.429429054260254, "learning_rate": 3.2947368421052633e-06, "loss": 0.7445, "step": 748 }, { "epoch": 0.7164750957854407, "loss_full_dim": 0.3499738276004791, "loss_main": 0.7164838314056396, "loss_parscale": 0.72265625, "loss_sub_dim": 0.3665100038051605, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 748 }, { "epoch": 0.7174329501915708, "grad_norm": 7.218719005584717, "learning_rate": 3.292105263157895e-06, "loss": 0.7165, "step": 749 }, { "epoch": 0.7174329501915708, "loss_full_dim": 0.3568890392780304, "loss_main": 0.7316980361938477, "loss_parscale": 0.734375, "loss_sub_dim": 0.37480902671813965, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.9765625, "step": 749 }, { "epoch": 0.7183908045977011, "grad_norm": 8.467309951782227, "learning_rate": 3.289473684210527e-06, "loss": 0.7317, "step": 750 }, { "epoch": 0.7183908045977011, "loss_full_dim": 0.38440465927124023, "loss_main": 0.7833202481269836, "loss_parscale": 0.78125, "loss_sub_dim": 0.3989155888557434, "loss_vclub": 0.0005340576171875, "parscale_sim": 0.98828125, "step": 750 }, { "epoch": 0.7193486590038314, "grad_norm": 8.257121086120605, "learning_rate": 3.286842105263158e-06, "loss": 0.7833, "step": 751 }, { "epoch": 0.7193486590038314, "loss_full_dim": 0.388271301984787, "loss_main": 0.7968193292617798, "loss_parscale": 0.796875, "loss_sub_dim": 0.4085480570793152, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.98828125, "step": 751 }, { "epoch": 0.7203065134099617, "grad_norm": 10.528382301330566, "learning_rate": 3.2842105263157897e-06, "loss": 0.7968, "step": 752 }, { "epoch": 0.7203065134099617, "loss_full_dim": 0.43272632360458374, "loss_main": 0.8843841552734375, "loss_parscale": 0.890625, "loss_sub_dim": 0.45165783166885376, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.95703125, "step": 752 }, { "epoch": 0.7212643678160919, "grad_norm": 10.639019966125488, "learning_rate": 3.2815789473684212e-06, "loss": 0.8844, "step": 753 }, { "epoch": 0.7212643678160919, "loss_full_dim": 0.3538007140159607, "loss_main": 0.7265771627426147, "loss_parscale": 0.734375, "loss_sub_dim": 0.37277647852897644, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.984375, "step": 753 }, { "epoch": 0.7222222222222222, "grad_norm": 9.565054893493652, "learning_rate": 3.278947368421053e-06, "loss": 0.7266, "step": 754 }, { "epoch": 0.7222222222222222, "loss_full_dim": 0.39075037837028503, "loss_main": 0.8024202585220337, "loss_parscale": 0.7890625, "loss_sub_dim": 0.41166988015174866, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.9765625, "step": 754 }, { "epoch": 0.7231800766283525, "grad_norm": 8.024005889892578, "learning_rate": 3.276315789473685e-06, "loss": 0.8024, "step": 755 }, { "epoch": 0.7231800766283525, "loss_full_dim": 0.4148763120174408, "loss_main": 0.847590446472168, "loss_parscale": 0.8515625, "loss_sub_dim": 0.4327141046524048, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.96875, "step": 755 }, { "epoch": 0.7241379310344828, "grad_norm": 6.829841136932373, "learning_rate": 3.273684210526316e-06, "loss": 0.8476, "step": 756 }, { "epoch": 0.7241379310344828, "loss_full_dim": 0.42481347918510437, "loss_main": 0.8712465167045593, "loss_parscale": 0.88671875, "loss_sub_dim": 0.44643303751945496, "loss_vclub": 0.000629425048828125, "parscale_sim": 0.98828125, "step": 756 }, { "epoch": 0.725095785440613, "grad_norm": 7.294730186462402, "learning_rate": 3.2710526315789476e-06, "loss": 0.8712, "step": 757 }, { "epoch": 0.725095785440613, "loss_full_dim": 0.4144469201564789, "loss_main": 0.8468756079673767, "loss_parscale": 0.84765625, "loss_sub_dim": 0.4324286878108978, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.98046875, "step": 757 }, { "epoch": 0.7260536398467433, "grad_norm": 8.321752548217773, "learning_rate": 3.268421052631579e-06, "loss": 0.8469, "step": 758 }, { "epoch": 0.7260536398467433, "loss_full_dim": 0.3716268837451935, "loss_main": 0.7601298689842224, "loss_parscale": 0.76171875, "loss_sub_dim": 0.38850298523902893, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.98828125, "step": 758 }, { "epoch": 0.7270114942528736, "grad_norm": 27.52883529663086, "learning_rate": 3.265789473684211e-06, "loss": 0.7601, "step": 759 }, { "epoch": 0.7270114942528736, "loss_full_dim": 0.3851022720336914, "loss_main": 0.7882940769195557, "loss_parscale": 0.7890625, "loss_sub_dim": 0.40319180488586426, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.98828125, "step": 759 }, { "epoch": 0.7279693486590039, "grad_norm": 11.661402702331543, "learning_rate": 3.2631578947368423e-06, "loss": 0.7883, "step": 760 }, { "epoch": 0.7279693486590039, "loss_full_dim": 0.43263447284698486, "loss_main": 0.8821297883987427, "loss_parscale": 0.8828125, "loss_sub_dim": 0.4494953155517578, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.98828125, "step": 760 }, { "epoch": 0.7289272030651341, "grad_norm": 8.398256301879883, "learning_rate": 3.260526315789474e-06, "loss": 0.8821, "step": 761 }, { "epoch": 0.7289272030651341, "loss_full_dim": 0.37487930059432983, "loss_main": 0.766431450843811, "loss_parscale": 0.7578125, "loss_sub_dim": 0.3915521204471588, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.98046875, "step": 761 }, { "epoch": 0.7298850574712644, "grad_norm": 7.830564498901367, "learning_rate": 3.2578947368421055e-06, "loss": 0.7664, "step": 762 }, { "epoch": 0.7298850574712644, "loss_full_dim": 0.2888449430465698, "loss_main": 0.5906187295913696, "loss_parscale": 0.59765625, "loss_sub_dim": 0.3017737865447998, "loss_vclub": 0.00055694580078125, "parscale_sim": 0.9765625, "step": 762 }, { "epoch": 0.7308429118773946, "grad_norm": 6.937254428863525, "learning_rate": 3.255263157894737e-06, "loss": 0.5906, "step": 763 }, { "epoch": 0.7308429118773946, "loss_full_dim": 0.36195558309555054, "loss_main": 0.7412332892417908, "loss_parscale": 0.7421875, "loss_sub_dim": 0.37927770614624023, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 763 }, { "epoch": 0.7318007662835249, "grad_norm": 9.175363540649414, "learning_rate": 3.252631578947369e-06, "loss": 0.7412, "step": 764 }, { "epoch": 0.7318007662835249, "loss_full_dim": 0.3726154863834381, "loss_main": 0.7623854875564575, "loss_parscale": 0.76953125, "loss_sub_dim": 0.3897700309753418, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 764 }, { "epoch": 0.7327586206896551, "grad_norm": 6.316338539123535, "learning_rate": 3.2500000000000002e-06, "loss": 0.7624, "step": 765 }, { "epoch": 0.7327586206896551, "loss_full_dim": 0.38089367747306824, "loss_main": 0.7804234027862549, "loss_parscale": 0.7890625, "loss_sub_dim": 0.39952975511550903, "loss_vclub": 0.000858306884765625, "parscale_sim": 0.984375, "step": 765 }, { "epoch": 0.7337164750957854, "grad_norm": 8.289268493652344, "learning_rate": 3.247368421052632e-06, "loss": 0.7804, "step": 766 }, { "epoch": 0.7337164750957854, "loss_full_dim": 0.36416059732437134, "loss_main": 0.7440589666366577, "loss_parscale": 0.73828125, "loss_sub_dim": 0.37989839911460876, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98828125, "step": 766 }, { "epoch": 0.7346743295019157, "grad_norm": 6.402018070220947, "learning_rate": 3.2447368421052634e-06, "loss": 0.7441, "step": 767 }, { "epoch": 0.7346743295019157, "loss_full_dim": 0.37678462266921997, "loss_main": 0.7709611654281616, "loss_parscale": 0.765625, "loss_sub_dim": 0.39417654275894165, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 767 }, { "epoch": 0.735632183908046, "grad_norm": 57.464439392089844, "learning_rate": 3.2421052631578945e-06, "loss": 0.771, "step": 768 }, { "epoch": 0.735632183908046, "loss_full_dim": 0.3748184144496918, "loss_main": 0.7682278752326965, "loss_parscale": 0.77734375, "loss_sub_dim": 0.39340946078300476, "loss_vclub": 0.00079345703125, "parscale_sim": 0.98828125, "step": 768 }, { "epoch": 0.7365900383141762, "grad_norm": 14.551556587219238, "learning_rate": 3.239473684210527e-06, "loss": 0.7682, "step": 769 }, { "epoch": 0.7365900383141762, "loss_full_dim": 0.3279408812522888, "loss_main": 0.6723395586013794, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3443986475467682, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.984375, "step": 769 }, { "epoch": 0.7375478927203065, "grad_norm": 7.488635540008545, "learning_rate": 3.236842105263158e-06, "loss": 0.6723, "step": 770 }, { "epoch": 0.7375478927203065, "loss_full_dim": 0.3305681049823761, "loss_main": 0.6786375045776367, "loss_parscale": 0.68359375, "loss_sub_dim": 0.348069429397583, "loss_vclub": 0.0006103515625, "parscale_sim": 0.984375, "step": 770 }, { "epoch": 0.7385057471264368, "grad_norm": 7.789098262786865, "learning_rate": 3.2342105263157897e-06, "loss": 0.6786, "step": 771 }, { "epoch": 0.7385057471264368, "loss_full_dim": 0.3816453814506531, "loss_main": 0.7830426096916199, "loss_parscale": 0.796875, "loss_sub_dim": 0.4013972282409668, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.98828125, "step": 771 }, { "epoch": 0.7394636015325671, "grad_norm": 5.757874011993408, "learning_rate": 3.2315789473684213e-06, "loss": 0.783, "step": 772 }, { "epoch": 0.7394636015325671, "loss_full_dim": 0.36190181970596313, "loss_main": 0.7412213683128357, "loss_parscale": 0.75, "loss_sub_dim": 0.37931954860687256, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98828125, "step": 772 }, { "epoch": 0.7404214559386973, "grad_norm": 10.239150047302246, "learning_rate": 3.2289473684210533e-06, "loss": 0.7412, "step": 773 }, { "epoch": 0.7404214559386973, "loss_full_dim": 0.37116673588752747, "loss_main": 0.7617790699005127, "loss_parscale": 0.7578125, "loss_sub_dim": 0.3906123638153076, "loss_vclub": 0.000743865966796875, "parscale_sim": 0.984375, "step": 773 }, { "epoch": 0.7413793103448276, "grad_norm": 9.332578659057617, "learning_rate": 3.2263157894736845e-06, "loss": 0.7618, "step": 774 }, { "epoch": 0.7413793103448276, "loss_full_dim": 0.3922003507614136, "loss_main": 0.8052269220352173, "loss_parscale": 0.8203125, "loss_sub_dim": 0.4130265712738037, "loss_vclub": 0.00067138671875, "parscale_sim": 0.9921875, "step": 774 }, { "epoch": 0.7423371647509579, "grad_norm": 13.2467679977417, "learning_rate": 3.223684210526316e-06, "loss": 0.8052, "step": 775 }, { "epoch": 0.7423371647509579, "loss_full_dim": 0.36912184953689575, "loss_main": 0.7567237615585327, "loss_parscale": 0.76171875, "loss_sub_dim": 0.38760191202163696, "loss_vclub": 0.00058746337890625, "parscale_sim": 0.98828125, "step": 775 }, { "epoch": 0.7432950191570882, "grad_norm": 8.720891952514648, "learning_rate": 3.2210526315789476e-06, "loss": 0.7567, "step": 776 }, { "epoch": 0.7432950191570882, "loss_full_dim": 0.3910040855407715, "loss_main": 0.806572437286377, "loss_parscale": 0.81640625, "loss_sub_dim": 0.41556835174560547, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 776 }, { "epoch": 0.7442528735632183, "grad_norm": 8.015515327453613, "learning_rate": 3.218421052631579e-06, "loss": 0.8066, "step": 777 }, { "epoch": 0.7442528735632183, "loss_full_dim": 0.38875633478164673, "loss_main": 0.795663595199585, "loss_parscale": 0.80078125, "loss_sub_dim": 0.40690726041793823, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98046875, "step": 777 }, { "epoch": 0.7452107279693486, "grad_norm": 50.192501068115234, "learning_rate": 3.215789473684211e-06, "loss": 0.7957, "step": 778 }, { "epoch": 0.7452107279693486, "loss_full_dim": 0.39172807335853577, "loss_main": 0.8042851686477661, "loss_parscale": 0.80078125, "loss_sub_dim": 0.41255706548690796, "loss_vclub": 0.00079345703125, "parscale_sim": 0.98828125, "step": 778 }, { "epoch": 0.7461685823754789, "grad_norm": 12.332130432128906, "learning_rate": 3.2131578947368424e-06, "loss": 0.8043, "step": 779 }, { "epoch": 0.7461685823754789, "loss_full_dim": 0.3319788873195648, "loss_main": 0.6853560209274292, "loss_parscale": 0.68359375, "loss_sub_dim": 0.35337716341018677, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.98046875, "step": 779 }, { "epoch": 0.7471264367816092, "grad_norm": 7.163308143615723, "learning_rate": 3.210526315789474e-06, "loss": 0.6854, "step": 780 }, { "epoch": 0.7471264367816092, "loss_full_dim": 0.38141775131225586, "loss_main": 0.7795907258987427, "loss_parscale": 0.78125, "loss_sub_dim": 0.3981730043888092, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.984375, "step": 780 }, { "epoch": 0.7480842911877394, "grad_norm": 27.002727508544922, "learning_rate": 3.2078947368421055e-06, "loss": 0.7796, "step": 781 }, { "epoch": 0.7480842911877394, "loss_full_dim": 0.40373072028160095, "loss_main": 0.8242517709732056, "loss_parscale": 0.83203125, "loss_sub_dim": 0.420521080493927, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.98828125, "step": 781 }, { "epoch": 0.7490421455938697, "grad_norm": 8.101536750793457, "learning_rate": 3.2052631578947367e-06, "loss": 0.8243, "step": 782 }, { "epoch": 0.7490421455938697, "loss_full_dim": 0.419074147939682, "loss_main": 0.853859543800354, "loss_parscale": 0.8515625, "loss_sub_dim": 0.4347854256629944, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.98828125, "step": 782 }, { "epoch": 0.75, "grad_norm": 8.272571563720703, "learning_rate": 3.2026315789473687e-06, "loss": 0.8539, "step": 783 }, { "epoch": 0.75, "loss_full_dim": 0.4003658592700958, "loss_main": 0.8202476501464844, "loss_parscale": 0.8359375, "loss_sub_dim": 0.41988176107406616, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.98828125, "step": 783 }, { "epoch": 0.7509578544061303, "grad_norm": 10.603716850280762, "learning_rate": 3.2000000000000003e-06, "loss": 0.8202, "step": 784 }, { "epoch": 0.7509578544061303, "loss_full_dim": 0.35417401790618896, "loss_main": 0.7279740571975708, "loss_parscale": 0.734375, "loss_sub_dim": 0.37380003929138184, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.98828125, "step": 784 }, { "epoch": 0.7519157088122606, "grad_norm": 16.333202362060547, "learning_rate": 3.197368421052632e-06, "loss": 0.728, "step": 785 }, { "epoch": 0.7519157088122606, "loss_full_dim": 0.33875972032546997, "loss_main": 0.692286491394043, "loss_parscale": 0.6953125, "loss_sub_dim": 0.3535267412662506, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.984375, "step": 785 }, { "epoch": 0.7528735632183908, "grad_norm": 24.493457794189453, "learning_rate": 3.1947368421052634e-06, "loss": 0.6923, "step": 786 }, { "epoch": 0.7528735632183908, "loss_full_dim": 0.35397493839263916, "loss_main": 0.728640615940094, "loss_parscale": 0.73046875, "loss_sub_dim": 0.37466567754745483, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.984375, "step": 786 }, { "epoch": 0.7538314176245211, "grad_norm": 4.785703659057617, "learning_rate": 3.1921052631578954e-06, "loss": 0.7286, "step": 787 }, { "epoch": 0.7538314176245211, "loss_full_dim": 0.3845701217651367, "loss_main": 0.7872799038887024, "loss_parscale": 0.80078125, "loss_sub_dim": 0.4027097821235657, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.984375, "step": 787 }, { "epoch": 0.7547892720306514, "grad_norm": 10.120992660522461, "learning_rate": 3.1894736842105266e-06, "loss": 0.7873, "step": 788 }, { "epoch": 0.7547892720306514, "loss_full_dim": 0.39104363322257996, "loss_main": 0.8030381202697754, "loss_parscale": 0.8125, "loss_sub_dim": 0.4119945168495178, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.9921875, "step": 788 }, { "epoch": 0.7557471264367817, "grad_norm": 10.60330867767334, "learning_rate": 3.186842105263158e-06, "loss": 0.803, "step": 789 }, { "epoch": 0.7557471264367817, "loss_full_dim": 0.3970607817173004, "loss_main": 0.8127645254135132, "loss_parscale": 0.796875, "loss_sub_dim": 0.41570377349853516, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.98828125, "step": 789 }, { "epoch": 0.7567049808429118, "grad_norm": 6.8517560958862305, "learning_rate": 3.1842105263157898e-06, "loss": 0.8128, "step": 790 }, { "epoch": 0.7567049808429118, "loss_full_dim": 0.39031147956848145, "loss_main": 0.7972822189331055, "loss_parscale": 0.796875, "loss_sub_dim": 0.40697070956230164, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.98828125, "step": 790 }, { "epoch": 0.7576628352490421, "grad_norm": 6.95706844329834, "learning_rate": 3.181578947368421e-06, "loss": 0.7973, "step": 791 }, { "epoch": 0.7576628352490421, "loss_full_dim": 0.37776049971580505, "loss_main": 0.7748857736587524, "loss_parscale": 0.78125, "loss_sub_dim": 0.3971252739429474, "loss_vclub": 0.000568389892578125, "parscale_sim": 0.984375, "step": 791 }, { "epoch": 0.7586206896551724, "grad_norm": 7.687861919403076, "learning_rate": 3.178947368421053e-06, "loss": 0.7749, "step": 792 }, { "epoch": 0.7586206896551724, "loss_full_dim": 0.40960991382598877, "loss_main": 0.8411870002746582, "loss_parscale": 0.8515625, "loss_sub_dim": 0.43157705664634705, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.98828125, "step": 792 }, { "epoch": 0.7595785440613027, "grad_norm": 8.048259735107422, "learning_rate": 3.1763157894736845e-06, "loss": 0.8412, "step": 793 }, { "epoch": 0.7595785440613027, "loss_full_dim": 0.38444119691848755, "loss_main": 0.787815511226654, "loss_parscale": 0.796875, "loss_sub_dim": 0.4033743143081665, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.98828125, "step": 793 }, { "epoch": 0.7605363984674329, "grad_norm": 9.19841194152832, "learning_rate": 3.173684210526316e-06, "loss": 0.7878, "step": 794 }, { "epoch": 0.7605363984674329, "loss_full_dim": 0.360301673412323, "loss_main": 0.7369178533554077, "loss_parscale": 0.7421875, "loss_sub_dim": 0.3766161799430847, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.96484375, "step": 794 }, { "epoch": 0.7614942528735632, "grad_norm": 8.614363670349121, "learning_rate": 3.1710526315789477e-06, "loss": 0.7369, "step": 795 }, { "epoch": 0.7614942528735632, "loss_full_dim": 0.3413884937763214, "loss_main": 0.699418306350708, "loss_parscale": 0.703125, "loss_sub_dim": 0.3580298125743866, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.98828125, "step": 795 }, { "epoch": 0.7624521072796935, "grad_norm": 19.495616912841797, "learning_rate": 3.168421052631579e-06, "loss": 0.6994, "step": 796 }, { "epoch": 0.7624521072796935, "loss_full_dim": 0.32830020785331726, "loss_main": 0.6765648126602173, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34826457500457764, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98828125, "step": 796 }, { "epoch": 0.7634099616858238, "grad_norm": 9.575248718261719, "learning_rate": 3.165789473684211e-06, "loss": 0.6766, "step": 797 }, { "epoch": 0.7634099616858238, "loss_full_dim": 0.2979837656021118, "loss_main": 0.6144860982894897, "loss_parscale": 0.60546875, "loss_sub_dim": 0.31650233268737793, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.98828125, "step": 797 }, { "epoch": 0.764367816091954, "grad_norm": 10.896347999572754, "learning_rate": 3.1631578947368424e-06, "loss": 0.6145, "step": 798 }, { "epoch": 0.764367816091954, "loss_full_dim": 0.36699697375297546, "loss_main": 0.7534278631210327, "loss_parscale": 0.75, "loss_sub_dim": 0.38643085956573486, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.98046875, "step": 798 }, { "epoch": 0.7653256704980843, "grad_norm": 9.898066520690918, "learning_rate": 3.160526315789474e-06, "loss": 0.7534, "step": 799 }, { "epoch": 0.7653256704980843, "loss_full_dim": 0.3428364098072052, "loss_main": 0.7037961483001709, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3609597086906433, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.984375, "step": 799 }, { "epoch": 0.7662835249042146, "grad_norm": 7.71414852142334, "learning_rate": 3.157894736842105e-06, "loss": 0.7038, "step": 800 }, { "epoch": 0.7662835249042146, "loss_full_dim": 0.38282570242881775, "loss_main": 0.783216118812561, "loss_parscale": 0.78515625, "loss_sub_dim": 0.4003903865814209, "loss_vclub": 0.000782012939453125, "parscale_sim": 0.98828125, "step": 800 }, { "epoch": 0.7672413793103449, "grad_norm": 8.194360733032227, "learning_rate": 3.155263157894737e-06, "loss": 0.7832, "step": 801 }, { "epoch": 0.7672413793103449, "loss_full_dim": 0.3464471101760864, "loss_main": 0.7079854607582092, "loss_parscale": 0.71484375, "loss_sub_dim": 0.3615383505821228, "loss_vclub": 0.000583648681640625, "parscale_sim": 0.984375, "step": 801 }, { "epoch": 0.7681992337164751, "grad_norm": 9.856093406677246, "learning_rate": 3.1526315789473688e-06, "loss": 0.708, "step": 802 }, { "epoch": 0.7681992337164751, "loss_full_dim": 0.35673558712005615, "loss_main": 0.7286867499351501, "loss_parscale": 0.734375, "loss_sub_dim": 0.371951162815094, "loss_vclub": 0.000640869140625, "parscale_sim": 0.98046875, "step": 802 }, { "epoch": 0.7691570881226054, "grad_norm": 5.979557037353516, "learning_rate": 3.1500000000000003e-06, "loss": 0.7287, "step": 803 }, { "epoch": 0.7691570881226054, "loss_full_dim": 0.3777161240577698, "loss_main": 0.7760990262031555, "loss_parscale": 0.79296875, "loss_sub_dim": 0.39838290214538574, "loss_vclub": 0.000823974609375, "parscale_sim": 0.984375, "step": 803 }, { "epoch": 0.7701149425287356, "grad_norm": 10.067408561706543, "learning_rate": 3.147368421052632e-06, "loss": 0.7761, "step": 804 }, { "epoch": 0.7701149425287356, "loss_full_dim": 0.34336501359939575, "loss_main": 0.7047150135040283, "loss_parscale": 0.71484375, "loss_sub_dim": 0.36134999990463257, "loss_vclub": 0.000637054443359375, "parscale_sim": 0.984375, "step": 804 }, { "epoch": 0.7710727969348659, "grad_norm": 6.30320930480957, "learning_rate": 3.144736842105263e-06, "loss": 0.7047, "step": 805 }, { "epoch": 0.7710727969348659, "loss_full_dim": 0.3535256087779999, "loss_main": 0.7262726426124573, "loss_parscale": 0.71875, "loss_sub_dim": 0.3727470338344574, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.984375, "step": 805 }, { "epoch": 0.7720306513409961, "grad_norm": 14.291893005371094, "learning_rate": 3.142105263157895e-06, "loss": 0.7263, "step": 806 }, { "epoch": 0.7720306513409961, "loss_full_dim": 0.37384653091430664, "loss_main": 0.7653008699417114, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3914543390274048, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.96875, "step": 806 }, { "epoch": 0.7729885057471264, "grad_norm": 18.635223388671875, "learning_rate": 3.1394736842105267e-06, "loss": 0.7653, "step": 807 }, { "epoch": 0.7729885057471264, "loss_full_dim": 0.37121501564979553, "loss_main": 0.7654800415039062, "loss_parscale": 0.765625, "loss_sub_dim": 0.3942650258541107, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.984375, "step": 807 }, { "epoch": 0.7739463601532567, "grad_norm": 12.262848854064941, "learning_rate": 3.1368421052631582e-06, "loss": 0.7655, "step": 808 }, { "epoch": 0.7739463601532567, "loss_full_dim": 0.33007800579071045, "loss_main": 0.6767109632492065, "loss_parscale": 0.6875, "loss_sub_dim": 0.3466329574584961, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98046875, "step": 808 }, { "epoch": 0.774904214559387, "grad_norm": 8.532837867736816, "learning_rate": 3.1342105263157894e-06, "loss": 0.6767, "step": 809 }, { "epoch": 0.774904214559387, "loss_full_dim": 0.2943371534347534, "loss_main": 0.6042945981025696, "loss_parscale": 0.6171875, "loss_sub_dim": 0.30995744466781616, "loss_vclub": 0.000701904296875, "parscale_sim": 0.984375, "step": 809 }, { "epoch": 0.7758620689655172, "grad_norm": 11.4840726852417, "learning_rate": 3.131578947368421e-06, "loss": 0.6043, "step": 810 }, { "epoch": 0.7758620689655172, "loss_full_dim": 0.3599211871623993, "loss_main": 0.7371656894683838, "loss_parscale": 0.7421875, "loss_sub_dim": 0.3772444725036621, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98828125, "step": 810 }, { "epoch": 0.7768199233716475, "grad_norm": 7.437788009643555, "learning_rate": 3.128947368421053e-06, "loss": 0.7372, "step": 811 }, { "epoch": 0.7768199233716475, "loss_full_dim": 0.3089953660964966, "loss_main": 0.6365423202514648, "loss_parscale": 0.640625, "loss_sub_dim": 0.32754695415496826, "loss_vclub": 0.0006103515625, "parscale_sim": 0.984375, "step": 811 }, { "epoch": 0.7777777777777778, "grad_norm": 8.229411125183105, "learning_rate": 3.1263157894736846e-06, "loss": 0.6365, "step": 812 }, { "epoch": 0.7777777777777778, "loss_full_dim": 0.38262873888015747, "loss_main": 0.7839723825454712, "loss_parscale": 0.796875, "loss_sub_dim": 0.4013436436653137, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.96484375, "step": 812 }, { "epoch": 0.7787356321839081, "grad_norm": 9.137152671813965, "learning_rate": 3.123684210526316e-06, "loss": 0.784, "step": 813 }, { "epoch": 0.7787356321839081, "loss_full_dim": 0.3710079789161682, "loss_main": 0.7568399310112, "loss_parscale": 0.7578125, "loss_sub_dim": 0.38583195209503174, "loss_vclub": 0.00058746337890625, "parscale_sim": 0.97265625, "step": 813 }, { "epoch": 0.7796934865900383, "grad_norm": 8.952507019042969, "learning_rate": 3.1210526315789473e-06, "loss": 0.7568, "step": 814 }, { "epoch": 0.7796934865900383, "loss_full_dim": 0.3491477966308594, "loss_main": 0.7138403058052063, "loss_parscale": 0.703125, "loss_sub_dim": 0.3646925091743469, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.98828125, "step": 814 }, { "epoch": 0.7806513409961686, "grad_norm": 8.58908748626709, "learning_rate": 3.1184210526315793e-06, "loss": 0.7138, "step": 815 }, { "epoch": 0.7806513409961686, "loss_full_dim": 0.3725146949291229, "loss_main": 0.7626825571060181, "loss_parscale": 0.765625, "loss_sub_dim": 0.39016789197921753, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98828125, "step": 815 }, { "epoch": 0.7816091954022989, "grad_norm": 7.2664031982421875, "learning_rate": 3.115789473684211e-06, "loss": 0.7627, "step": 816 }, { "epoch": 0.7816091954022989, "loss_full_dim": 0.4361073076725006, "loss_main": 0.8878037929534912, "loss_parscale": 0.8828125, "loss_sub_dim": 0.451696515083313, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.984375, "step": 816 }, { "epoch": 0.7825670498084292, "grad_norm": 1365.956298828125, "learning_rate": 3.1131578947368425e-06, "loss": 0.8878, "step": 817 }, { "epoch": 0.7825670498084292, "loss_full_dim": 0.3116569221019745, "loss_main": 0.6394515037536621, "loss_parscale": 0.65234375, "loss_sub_dim": 0.32779455184936523, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.984375, "step": 817 }, { "epoch": 0.7835249042145593, "grad_norm": 5.430070400238037, "learning_rate": 3.1105263157894736e-06, "loss": 0.6395, "step": 818 }, { "epoch": 0.7835249042145593, "loss_full_dim": 0.34868448972702026, "loss_main": 0.7132883071899414, "loss_parscale": 0.7109375, "loss_sub_dim": 0.36460381746292114, "loss_vclub": 0.000659942626953125, "parscale_sim": 0.98828125, "step": 818 }, { "epoch": 0.7844827586206896, "grad_norm": 5.827908992767334, "learning_rate": 3.1078947368421052e-06, "loss": 0.7133, "step": 819 }, { "epoch": 0.7844827586206896, "loss_full_dim": 0.3272685110569, "loss_main": 0.6717526912689209, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3444841504096985, "loss_vclub": 0.000774383544921875, "parscale_sim": 0.98828125, "step": 819 }, { "epoch": 0.7854406130268199, "grad_norm": 36.487674713134766, "learning_rate": 3.1052631578947372e-06, "loss": 0.6718, "step": 820 }, { "epoch": 0.7854406130268199, "loss_full_dim": 0.3050040900707245, "loss_main": 0.6228729486465454, "loss_parscale": 0.62109375, "loss_sub_dim": 0.31786882877349854, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.98828125, "step": 820 }, { "epoch": 0.7863984674329502, "grad_norm": 6.342762470245361, "learning_rate": 3.102631578947369e-06, "loss": 0.6229, "step": 821 }, { "epoch": 0.7863984674329502, "loss_full_dim": 0.3334041237831116, "loss_main": 0.681407630443573, "loss_parscale": 0.6875, "loss_sub_dim": 0.3480035066604614, "loss_vclub": 0.000640869140625, "parscale_sim": 0.98828125, "step": 821 }, { "epoch": 0.7873563218390804, "grad_norm": 12.172955513000488, "learning_rate": 3.1000000000000004e-06, "loss": 0.6814, "step": 822 }, { "epoch": 0.7873563218390804, "loss_full_dim": 0.3136068880558014, "loss_main": 0.6433926224708557, "loss_parscale": 0.65625, "loss_sub_dim": 0.3297857344150543, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.984375, "step": 822 }, { "epoch": 0.7883141762452107, "grad_norm": 10.794767379760742, "learning_rate": 3.0973684210526315e-06, "loss": 0.6434, "step": 823 }, { "epoch": 0.7883141762452107, "loss_full_dim": 0.4052444100379944, "loss_main": 0.8258765935897827, "loss_parscale": 0.82421875, "loss_sub_dim": 0.42063218355178833, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.98828125, "step": 823 }, { "epoch": 0.789272030651341, "grad_norm": 13.284801483154297, "learning_rate": 3.094736842105263e-06, "loss": 0.8259, "step": 824 }, { "epoch": 0.789272030651341, "loss_full_dim": 0.39011862874031067, "loss_main": 0.8003398180007935, "loss_parscale": 0.8125, "loss_sub_dim": 0.4102212190628052, "loss_vclub": 0.000762939453125, "parscale_sim": 0.984375, "step": 824 }, { "epoch": 0.7902298850574713, "grad_norm": 9.504220962524414, "learning_rate": 3.092105263157895e-06, "loss": 0.8003, "step": 825 }, { "epoch": 0.7902298850574713, "loss_full_dim": 0.3704507350921631, "loss_main": 0.758926272392273, "loss_parscale": 0.765625, "loss_sub_dim": 0.3884755074977875, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 825 }, { "epoch": 0.7911877394636015, "grad_norm": 8.783402442932129, "learning_rate": 3.0894736842105267e-06, "loss": 0.7589, "step": 826 }, { "epoch": 0.7911877394636015, "loss_full_dim": 0.3728996813297272, "loss_main": 0.768376350402832, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39547663927078247, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.9765625, "step": 826 }, { "epoch": 0.7921455938697318, "grad_norm": 6.824539661407471, "learning_rate": 3.086842105263158e-06, "loss": 0.7684, "step": 827 }, { "epoch": 0.7921455938697318, "loss_full_dim": 0.3476874530315399, "loss_main": 0.7108920812606812, "loss_parscale": 0.71484375, "loss_sub_dim": 0.36320459842681885, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.984375, "step": 827 }, { "epoch": 0.7931034482758621, "grad_norm": 9.53125, "learning_rate": 3.0842105263157895e-06, "loss": 0.7109, "step": 828 }, { "epoch": 0.7931034482758621, "loss_full_dim": 0.3427935242652893, "loss_main": 0.7014038562774658, "loss_parscale": 0.69921875, "loss_sub_dim": 0.3586103320121765, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98046875, "step": 828 }, { "epoch": 0.7940613026819924, "grad_norm": 8.983015060424805, "learning_rate": 3.0815789473684215e-06, "loss": 0.7014, "step": 829 }, { "epoch": 0.7940613026819924, "loss_full_dim": 0.3895237445831299, "loss_main": 0.7985401749610901, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4090164303779602, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 829 }, { "epoch": 0.7950191570881227, "grad_norm": 8.5875244140625, "learning_rate": 3.078947368421053e-06, "loss": 0.7985, "step": 830 }, { "epoch": 0.7950191570881227, "loss_full_dim": 0.3625388443470001, "loss_main": 0.7441583871841431, "loss_parscale": 0.75, "loss_sub_dim": 0.38161957263946533, "loss_vclub": 0.000621795654296875, "parscale_sim": 0.984375, "step": 830 }, { "epoch": 0.7959770114942529, "grad_norm": 8.299896240234375, "learning_rate": 3.0763157894736846e-06, "loss": 0.7442, "step": 831 }, { "epoch": 0.7959770114942529, "loss_full_dim": 0.33261728286743164, "loss_main": 0.682502269744873, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3498849868774414, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.984375, "step": 831 }, { "epoch": 0.7969348659003831, "grad_norm": 10.843989372253418, "learning_rate": 3.0736842105263158e-06, "loss": 0.6825, "step": 832 }, { "epoch": 0.7969348659003831, "loss_full_dim": 0.3676666021347046, "loss_main": 0.7556667327880859, "loss_parscale": 0.765625, "loss_sub_dim": 0.38800013065338135, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 832 }, { "epoch": 0.7978927203065134, "grad_norm": 24.26394271850586, "learning_rate": 3.0710526315789474e-06, "loss": 0.7557, "step": 833 }, { "epoch": 0.7978927203065134, "loss_full_dim": 0.328512042760849, "loss_main": 0.6778509616851807, "loss_parscale": 0.6875, "loss_sub_dim": 0.3493388891220093, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.984375, "step": 833 }, { "epoch": 0.7988505747126436, "grad_norm": 6.897339820861816, "learning_rate": 3.0684210526315794e-06, "loss": 0.6779, "step": 834 }, { "epoch": 0.7988505747126436, "loss_full_dim": 0.32657238841056824, "loss_main": 0.6694400906562805, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3428677022457123, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.984375, "step": 834 }, { "epoch": 0.7998084291187739, "grad_norm": 7.193480491638184, "learning_rate": 3.065789473684211e-06, "loss": 0.6694, "step": 835 }, { "epoch": 0.7998084291187739, "loss_full_dim": 0.3356044590473175, "loss_main": 0.6871324181556702, "loss_parscale": 0.6875, "loss_sub_dim": 0.35152795910835266, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.9765625, "step": 835 }, { "epoch": 0.8007662835249042, "grad_norm": 9.82331371307373, "learning_rate": 3.0631578947368425e-06, "loss": 0.6871, "step": 836 }, { "epoch": 0.8007662835249042, "loss_full_dim": 0.3043815493583679, "loss_main": 0.6255244016647339, "loss_parscale": 0.6328125, "loss_sub_dim": 0.32114288210868835, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.9609375, "step": 836 }, { "epoch": 0.8017241379310345, "grad_norm": 5.545530319213867, "learning_rate": 3.0605263157894737e-06, "loss": 0.6255, "step": 837 }, { "epoch": 0.8017241379310345, "loss_full_dim": 0.3104008436203003, "loss_main": 0.634812593460083, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3244117200374603, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.984375, "step": 837 }, { "epoch": 0.8026819923371648, "grad_norm": 6.824638843536377, "learning_rate": 3.0578947368421053e-06, "loss": 0.6348, "step": 838 }, { "epoch": 0.8026819923371648, "loss_full_dim": 0.36217138171195984, "loss_main": 0.7415652275085449, "loss_parscale": 0.75, "loss_sub_dim": 0.37939387559890747, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.9921875, "step": 838 }, { "epoch": 0.803639846743295, "grad_norm": 7.699575424194336, "learning_rate": 3.0552631578947373e-06, "loss": 0.7416, "step": 839 }, { "epoch": 0.803639846743295, "loss_full_dim": 0.3098408281803131, "loss_main": 0.6336972713470459, "loss_parscale": 0.63671875, "loss_sub_dim": 0.3238564729690552, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.96484375, "step": 839 }, { "epoch": 0.8045977011494253, "grad_norm": 5.4642720222473145, "learning_rate": 3.052631578947369e-06, "loss": 0.6337, "step": 840 }, { "epoch": 0.8045977011494253, "loss_full_dim": 0.39832431077957153, "loss_main": 0.8147023916244507, "loss_parscale": 0.80859375, "loss_sub_dim": 0.41637811064720154, "loss_vclub": 0.000583648681640625, "parscale_sim": 0.98828125, "step": 840 }, { "epoch": 0.8055555555555556, "grad_norm": 7.9674835205078125, "learning_rate": 3.05e-06, "loss": 0.8147, "step": 841 }, { "epoch": 0.8055555555555556, "loss_full_dim": 0.36450716853141785, "loss_main": 0.7466917037963867, "loss_parscale": 0.765625, "loss_sub_dim": 0.38218456506729126, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 841 }, { "epoch": 0.8065134099616859, "grad_norm": 42.333091735839844, "learning_rate": 3.0473684210526316e-06, "loss": 0.7467, "step": 842 }, { "epoch": 0.8065134099616859, "loss_full_dim": 0.3717806339263916, "loss_main": 0.7609714269638062, "loss_parscale": 0.765625, "loss_sub_dim": 0.38919079303741455, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.984375, "step": 842 }, { "epoch": 0.8074712643678161, "grad_norm": 7.215214729309082, "learning_rate": 3.0447368421052636e-06, "loss": 0.761, "step": 843 }, { "epoch": 0.8074712643678161, "loss_full_dim": 0.30982354283332825, "loss_main": 0.6341785192489624, "loss_parscale": 0.62890625, "loss_sub_dim": 0.32435497641563416, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.984375, "step": 843 }, { "epoch": 0.8084291187739464, "grad_norm": 14.407883644104004, "learning_rate": 3.042105263157895e-06, "loss": 0.6342, "step": 844 }, { "epoch": 0.8084291187739464, "loss_full_dim": 0.35606977343559265, "loss_main": 0.7275522947311401, "loss_parscale": 0.73828125, "loss_sub_dim": 0.3714824914932251, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 844 }, { "epoch": 0.8093869731800766, "grad_norm": 10.40653133392334, "learning_rate": 3.0394736842105268e-06, "loss": 0.7276, "step": 845 }, { "epoch": 0.8093869731800766, "loss_full_dim": 0.38466477394104004, "loss_main": 0.7843971252441406, "loss_parscale": 0.78125, "loss_sub_dim": 0.3997323513031006, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98046875, "step": 845 }, { "epoch": 0.8103448275862069, "grad_norm": 7.513747215270996, "learning_rate": 3.036842105263158e-06, "loss": 0.7844, "step": 846 }, { "epoch": 0.8103448275862069, "loss_full_dim": 0.36687561869621277, "loss_main": 0.7507435083389282, "loss_parscale": 0.75390625, "loss_sub_dim": 0.38386785984039307, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.98828125, "step": 846 }, { "epoch": 0.8113026819923371, "grad_norm": 7.967982292175293, "learning_rate": 3.0342105263157895e-06, "loss": 0.7507, "step": 847 }, { "epoch": 0.8113026819923371, "loss_full_dim": 0.3462659418582916, "loss_main": 0.7078100442886353, "loss_parscale": 0.7109375, "loss_sub_dim": 0.361544132232666, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 847 }, { "epoch": 0.8122605363984674, "grad_norm": 19.758831024169922, "learning_rate": 3.0315789473684215e-06, "loss": 0.7078, "step": 848 }, { "epoch": 0.8122605363984674, "loss_full_dim": 0.34213101863861084, "loss_main": 0.6982743740081787, "loss_parscale": 0.6953125, "loss_sub_dim": 0.35614338517189026, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.98828125, "step": 848 }, { "epoch": 0.8132183908045977, "grad_norm": 9.059700012207031, "learning_rate": 3.028947368421053e-06, "loss": 0.6983, "step": 849 }, { "epoch": 0.8132183908045977, "loss_full_dim": 0.3854582607746124, "loss_main": 0.7889852523803711, "loss_parscale": 0.80078125, "loss_sub_dim": 0.40352702140808105, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.984375, "step": 849 }, { "epoch": 0.814176245210728, "grad_norm": 8.42410945892334, "learning_rate": 3.0263157894736843e-06, "loss": 0.789, "step": 850 }, { "epoch": 0.814176245210728, "loss_full_dim": 0.33257660269737244, "loss_main": 0.6807312965393066, "loss_parscale": 0.6875, "loss_sub_dim": 0.3481546938419342, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 850 }, { "epoch": 0.8151340996168582, "grad_norm": 7.08062744140625, "learning_rate": 3.023684210526316e-06, "loss": 0.6807, "step": 851 }, { "epoch": 0.8151340996168582, "loss_full_dim": 0.38134562969207764, "loss_main": 0.7784899473190308, "loss_parscale": 0.78125, "loss_sub_dim": 0.3971443176269531, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 851 }, { "epoch": 0.8160919540229885, "grad_norm": 5.681840896606445, "learning_rate": 3.0210526315789474e-06, "loss": 0.7785, "step": 852 }, { "epoch": 0.8160919540229885, "loss_full_dim": 0.3868343234062195, "loss_main": 0.7916737198829651, "loss_parscale": 0.796875, "loss_sub_dim": 0.4048393964767456, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.98828125, "step": 852 }, { "epoch": 0.8170498084291188, "grad_norm": 9.125032424926758, "learning_rate": 3.0184210526315794e-06, "loss": 0.7917, "step": 853 }, { "epoch": 0.8170498084291188, "loss_full_dim": 0.3530697226524353, "loss_main": 0.7193547487258911, "loss_parscale": 0.70703125, "loss_sub_dim": 0.3662850260734558, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98828125, "step": 853 }, { "epoch": 0.8180076628352491, "grad_norm": 148.15054321289062, "learning_rate": 3.015789473684211e-06, "loss": 0.7194, "step": 854 }, { "epoch": 0.8180076628352491, "loss_full_dim": 0.2893669903278351, "loss_main": 0.5922587513923645, "loss_parscale": 0.58984375, "loss_sub_dim": 0.3028917610645294, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.9921875, "step": 854 }, { "epoch": 0.8189655172413793, "grad_norm": 8.4315767288208, "learning_rate": 3.013157894736842e-06, "loss": 0.5923, "step": 855 }, { "epoch": 0.8189655172413793, "loss_full_dim": 0.34922435879707336, "loss_main": 0.7163172364234924, "loss_parscale": 0.7265625, "loss_sub_dim": 0.36709287762641907, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98046875, "step": 855 }, { "epoch": 0.8199233716475096, "grad_norm": 8.308494567871094, "learning_rate": 3.0105263157894737e-06, "loss": 0.7163, "step": 856 }, { "epoch": 0.8199233716475096, "loss_full_dim": 0.3359781503677368, "loss_main": 0.6873661279678345, "loss_parscale": 0.69921875, "loss_sub_dim": 0.35138797760009766, "loss_vclub": 0.000782012939453125, "parscale_sim": 0.984375, "step": 856 }, { "epoch": 0.8208812260536399, "grad_norm": 9.558688163757324, "learning_rate": 3.0078947368421058e-06, "loss": 0.6874, "step": 857 }, { "epoch": 0.8208812260536399, "loss_full_dim": 0.3294402062892914, "loss_main": 0.6729081869125366, "loss_parscale": 0.66796875, "loss_sub_dim": 0.3434680104255676, "loss_vclub": 0.000736236572265625, "parscale_sim": 0.98046875, "step": 857 }, { "epoch": 0.8218390804597702, "grad_norm": 13.547654151916504, "learning_rate": 3.0052631578947373e-06, "loss": 0.6729, "step": 858 }, { "epoch": 0.8218390804597702, "loss_full_dim": 0.3535515367984772, "loss_main": 0.7263714671134949, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3728199303150177, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 858 }, { "epoch": 0.8227969348659003, "grad_norm": 11.198668479919434, "learning_rate": 3.0026315789473685e-06, "loss": 0.7264, "step": 859 }, { "epoch": 0.8227969348659003, "loss_full_dim": 0.3625544309616089, "loss_main": 0.7409087419509888, "loss_parscale": 0.7421875, "loss_sub_dim": 0.37835434079170227, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98828125, "step": 859 }, { "epoch": 0.8237547892720306, "grad_norm": 7.001635551452637, "learning_rate": 3e-06, "loss": 0.7409, "step": 860 }, { "epoch": 0.8237547892720306, "loss_full_dim": 0.2799288332462311, "loss_main": 0.5767382383346558, "loss_parscale": 0.57421875, "loss_sub_dim": 0.2968094050884247, "loss_vclub": 0.0005340576171875, "parscale_sim": 0.98828125, "step": 860 }, { "epoch": 0.8247126436781609, "grad_norm": 7.759574890136719, "learning_rate": 2.9973684210526317e-06, "loss": 0.5767, "step": 861 }, { "epoch": 0.8247126436781609, "loss_full_dim": 0.3483108580112457, "loss_main": 0.7160260677337646, "loss_parscale": 0.734375, "loss_sub_dim": 0.36771517992019653, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.98828125, "step": 861 }, { "epoch": 0.8256704980842912, "grad_norm": 21.945158004760742, "learning_rate": 2.9947368421052637e-06, "loss": 0.716, "step": 862 }, { "epoch": 0.8256704980842912, "loss_full_dim": 0.35636892914772034, "loss_main": 0.7311338186264038, "loss_parscale": 0.7421875, "loss_sub_dim": 0.3747648596763611, "loss_vclub": 0.000736236572265625, "parscale_sim": 0.98828125, "step": 862 }, { "epoch": 0.8266283524904214, "grad_norm": 6.838197231292725, "learning_rate": 2.9921052631578952e-06, "loss": 0.7311, "step": 863 }, { "epoch": 0.8266283524904214, "loss_full_dim": 0.3352237045764923, "loss_main": 0.6846539974212646, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34943026304244995, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.984375, "step": 863 }, { "epoch": 0.8275862068965517, "grad_norm": 39.48699951171875, "learning_rate": 2.9894736842105264e-06, "loss": 0.6847, "step": 864 }, { "epoch": 0.8275862068965517, "loss_full_dim": 0.3147326111793518, "loss_main": 0.6467903256416321, "loss_parscale": 0.65625, "loss_sub_dim": 0.3320577144622803, "loss_vclub": 0.0009002685546875, "parscale_sim": 0.9921875, "step": 864 }, { "epoch": 0.828544061302682, "grad_norm": 6.135869979858398, "learning_rate": 2.986842105263158e-06, "loss": 0.6468, "step": 865 }, { "epoch": 0.828544061302682, "loss_full_dim": 0.3882702589035034, "loss_main": 0.7893517017364502, "loss_parscale": 0.79296875, "loss_sub_dim": 0.4010814428329468, "loss_vclub": 0.0005340576171875, "parscale_sim": 0.984375, "step": 865 }, { "epoch": 0.8295019157088123, "grad_norm": 6.808298110961914, "learning_rate": 2.9842105263157896e-06, "loss": 0.7894, "step": 866 }, { "epoch": 0.8295019157088123, "loss_full_dim": 0.33380138874053955, "loss_main": 0.6814193725585938, "loss_parscale": 0.68359375, "loss_sub_dim": 0.3476179540157318, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.9765625, "step": 866 }, { "epoch": 0.8304597701149425, "grad_norm": 7.752024173736572, "learning_rate": 2.9815789473684216e-06, "loss": 0.6814, "step": 867 }, { "epoch": 0.8304597701149425, "loss_full_dim": 0.3773235082626343, "loss_main": 0.7734730243682861, "loss_parscale": 0.78125, "loss_sub_dim": 0.39614948630332947, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.98828125, "step": 867 }, { "epoch": 0.8314176245210728, "grad_norm": 9.254548072814941, "learning_rate": 2.9789473684210527e-06, "loss": 0.7735, "step": 868 }, { "epoch": 0.8314176245210728, "loss_full_dim": 0.3765399158000946, "loss_main": 0.7675656080245972, "loss_parscale": 0.78125, "loss_sub_dim": 0.3910256624221802, "loss_vclub": 0.0009002685546875, "parscale_sim": 0.98828125, "step": 868 }, { "epoch": 0.8323754789272031, "grad_norm": 18.73403549194336, "learning_rate": 2.9763157894736843e-06, "loss": 0.7676, "step": 869 }, { "epoch": 0.8323754789272031, "loss_full_dim": 0.38168877363204956, "loss_main": 0.781649112701416, "loss_parscale": 0.78125, "loss_sub_dim": 0.39996033906936646, "loss_vclub": 0.0006103515625, "parscale_sim": 0.95703125, "step": 869 }, { "epoch": 0.8333333333333334, "grad_norm": 9.282000541687012, "learning_rate": 2.973684210526316e-06, "loss": 0.7816, "step": 870 }, { "epoch": 0.8333333333333334, "loss_full_dim": 0.33687713742256165, "loss_main": 0.6879532933235168, "loss_parscale": 0.703125, "loss_sub_dim": 0.3510761559009552, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98828125, "step": 870 }, { "epoch": 0.8342911877394636, "grad_norm": 5.881676197052002, "learning_rate": 2.971052631578948e-06, "loss": 0.688, "step": 871 }, { "epoch": 0.8342911877394636, "loss_full_dim": 0.3505293130874634, "loss_main": 0.7161815166473389, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3656522035598755, "loss_vclub": 0.000614166259765625, "parscale_sim": 0.984375, "step": 871 }, { "epoch": 0.8352490421455939, "grad_norm": 6.601246356964111, "learning_rate": 2.9684210526315795e-06, "loss": 0.7162, "step": 872 }, { "epoch": 0.8352490421455939, "loss_full_dim": 0.29709571599960327, "loss_main": 0.6098365187644958, "loss_parscale": 0.609375, "loss_sub_dim": 0.3127408027648926, "loss_vclub": 0.000652313232421875, "parscale_sim": 0.984375, "step": 872 }, { "epoch": 0.8362068965517241, "grad_norm": 7.868386268615723, "learning_rate": 2.9657894736842106e-06, "loss": 0.6098, "step": 873 }, { "epoch": 0.8362068965517241, "loss_full_dim": 0.29992640018463135, "loss_main": 0.6131629943847656, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3132365942001343, "loss_vclub": 0.000576019287109375, "parscale_sim": 0.98828125, "step": 873 }, { "epoch": 0.8371647509578544, "grad_norm": 10.950926780700684, "learning_rate": 2.9631578947368422e-06, "loss": 0.6132, "step": 874 }, { "epoch": 0.8371647509578544, "loss_full_dim": 0.3546949625015259, "loss_main": 0.7239624857902527, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3692675232887268, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.98828125, "step": 874 }, { "epoch": 0.8381226053639846, "grad_norm": 8.95497989654541, "learning_rate": 2.960526315789474e-06, "loss": 0.724, "step": 875 }, { "epoch": 0.8381226053639846, "loss_full_dim": 0.29859814047813416, "loss_main": 0.6149457693099976, "loss_parscale": 0.625, "loss_sub_dim": 0.3163476586341858, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98828125, "step": 875 }, { "epoch": 0.8390804597701149, "grad_norm": 7.937363147735596, "learning_rate": 2.957894736842106e-06, "loss": 0.6149, "step": 876 }, { "epoch": 0.8390804597701149, "loss_full_dim": 0.40412813425064087, "loss_main": 0.8227994441986084, "loss_parscale": 0.82421875, "loss_sub_dim": 0.41867130994796753, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 876 }, { "epoch": 0.8400383141762452, "grad_norm": 8.224370956420898, "learning_rate": 2.955263157894737e-06, "loss": 0.8228, "step": 877 }, { "epoch": 0.8400383141762452, "loss_full_dim": 0.38002991676330566, "loss_main": 0.7765829563140869, "loss_parscale": 0.78125, "loss_sub_dim": 0.39655303955078125, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.984375, "step": 877 }, { "epoch": 0.8409961685823755, "grad_norm": 6.036620140075684, "learning_rate": 2.9526315789473685e-06, "loss": 0.7766, "step": 878 }, { "epoch": 0.8409961685823755, "loss_full_dim": 0.3131045699119568, "loss_main": 0.6428313851356506, "loss_parscale": 0.6484375, "loss_sub_dim": 0.32972681522369385, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.984375, "step": 878 }, { "epoch": 0.8419540229885057, "grad_norm": 9.84361743927002, "learning_rate": 2.95e-06, "loss": 0.6428, "step": 879 }, { "epoch": 0.8419540229885057, "loss_full_dim": 0.35383328795433044, "loss_main": 0.7234617471694946, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3696284294128418, "loss_vclub": 0.00058746337890625, "parscale_sim": 0.984375, "step": 879 }, { "epoch": 0.842911877394636, "grad_norm": 7.817811965942383, "learning_rate": 2.9473684210526317e-06, "loss": 0.7235, "step": 880 }, { "epoch": 0.842911877394636, "loss_full_dim": 0.3191705644130707, "loss_main": 0.6519443988800049, "loss_parscale": 0.6484375, "loss_sub_dim": 0.3327738344669342, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98828125, "step": 880 }, { "epoch": 0.8438697318007663, "grad_norm": 7.289926052093506, "learning_rate": 2.9447368421052637e-06, "loss": 0.6519, "step": 881 }, { "epoch": 0.8438697318007663, "loss_full_dim": 0.37951239943504333, "loss_main": 0.7739800214767456, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39446765184402466, "loss_vclub": 0.000762939453125, "parscale_sim": 0.984375, "step": 881 }, { "epoch": 0.8448275862068966, "grad_norm": 7.494056224822998, "learning_rate": 2.942105263157895e-06, "loss": 0.774, "step": 882 }, { "epoch": 0.8448275862068966, "loss_full_dim": 0.348783016204834, "loss_main": 0.7126447558403015, "loss_parscale": 0.71875, "loss_sub_dim": 0.36386173963546753, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.984375, "step": 882 }, { "epoch": 0.8457854406130269, "grad_norm": 9.255812644958496, "learning_rate": 2.9394736842105265e-06, "loss": 0.7126, "step": 883 }, { "epoch": 0.8457854406130269, "loss_full_dim": 0.31459352374076843, "loss_main": 0.6438037157058716, "loss_parscale": 0.64453125, "loss_sub_dim": 0.32921022176742554, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.984375, "step": 883 }, { "epoch": 0.8467432950191571, "grad_norm": 8.078822135925293, "learning_rate": 2.936842105263158e-06, "loss": 0.6438, "step": 884 }, { "epoch": 0.8467432950191571, "loss_full_dim": 0.3268764019012451, "loss_main": 0.6706519722938538, "loss_parscale": 0.67578125, "loss_sub_dim": 0.34377557039260864, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.98046875, "step": 884 }, { "epoch": 0.8477011494252874, "grad_norm": 6.542845726013184, "learning_rate": 2.93421052631579e-06, "loss": 0.6707, "step": 885 }, { "epoch": 0.8477011494252874, "loss_full_dim": 0.3684973120689392, "loss_main": 0.7524536848068237, "loss_parscale": 0.75390625, "loss_sub_dim": 0.3839563727378845, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98046875, "step": 885 }, { "epoch": 0.8486590038314177, "grad_norm": 13.55430793762207, "learning_rate": 2.931578947368421e-06, "loss": 0.7525, "step": 886 }, { "epoch": 0.8486590038314177, "loss_full_dim": 0.4029504954814911, "loss_main": 0.8240404725074768, "loss_parscale": 0.828125, "loss_sub_dim": 0.4210899770259857, "loss_vclub": 0.000881195068359375, "parscale_sim": 0.9765625, "step": 886 }, { "epoch": 0.8496168582375478, "grad_norm": 34.00449752807617, "learning_rate": 2.9289473684210528e-06, "loss": 0.824, "step": 887 }, { "epoch": 0.8496168582375478, "loss_full_dim": 0.3375106155872345, "loss_main": 0.6927956342697144, "loss_parscale": 0.68359375, "loss_sub_dim": 0.35528504848480225, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.98046875, "step": 887 }, { "epoch": 0.8505747126436781, "grad_norm": 7.770313739776611, "learning_rate": 2.9263157894736844e-06, "loss": 0.6928, "step": 888 }, { "epoch": 0.8505747126436781, "loss_full_dim": 0.4073519706726074, "loss_main": 0.8340904116630554, "loss_parscale": 0.828125, "loss_sub_dim": 0.426738440990448, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.98828125, "step": 888 }, { "epoch": 0.8515325670498084, "grad_norm": 73.17156219482422, "learning_rate": 2.923684210526316e-06, "loss": 0.8341, "step": 889 }, { "epoch": 0.8515325670498084, "loss_full_dim": 0.3497976064682007, "loss_main": 0.7158296704292297, "loss_parscale": 0.72265625, "loss_sub_dim": 0.36603206396102905, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98828125, "step": 889 }, { "epoch": 0.8524904214559387, "grad_norm": 7.433826446533203, "learning_rate": 2.921052631578948e-06, "loss": 0.7158, "step": 890 }, { "epoch": 0.8524904214559387, "loss_full_dim": 0.35396772623062134, "loss_main": 0.7220548987388611, "loss_parscale": 0.73046875, "loss_sub_dim": 0.36808717250823975, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 890 }, { "epoch": 0.853448275862069, "grad_norm": 6.956943511962891, "learning_rate": 2.918421052631579e-06, "loss": 0.7221, "step": 891 }, { "epoch": 0.853448275862069, "loss_full_dim": 0.36999228596687317, "loss_main": 0.7565125823020935, "loss_parscale": 0.75390625, "loss_sub_dim": 0.38652029633522034, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.9921875, "step": 891 }, { "epoch": 0.8544061302681992, "grad_norm": 15.081738471984863, "learning_rate": 2.9157894736842107e-06, "loss": 0.7565, "step": 892 }, { "epoch": 0.8544061302681992, "loss_full_dim": 0.3516799509525299, "loss_main": 0.7219992876052856, "loss_parscale": 0.71875, "loss_sub_dim": 0.37031930685043335, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.984375, "step": 892 }, { "epoch": 0.8553639846743295, "grad_norm": 9.384671211242676, "learning_rate": 2.9131578947368423e-06, "loss": 0.722, "step": 893 }, { "epoch": 0.8553639846743295, "loss_full_dim": 0.35142624378204346, "loss_main": 0.7194395065307617, "loss_parscale": 0.71484375, "loss_sub_dim": 0.3680132329463959, "loss_vclub": 0.00054168701171875, "parscale_sim": 0.984375, "step": 893 }, { "epoch": 0.8563218390804598, "grad_norm": 7.837365627288818, "learning_rate": 2.9105263157894743e-06, "loss": 0.7194, "step": 894 }, { "epoch": 0.8563218390804598, "loss_full_dim": 0.3381443917751312, "loss_main": 0.6920708417892456, "loss_parscale": 0.6953125, "loss_sub_dim": 0.35392647981643677, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.98828125, "step": 894 }, { "epoch": 0.85727969348659, "grad_norm": 5.599165916442871, "learning_rate": 2.907894736842106e-06, "loss": 0.6921, "step": 895 }, { "epoch": 0.85727969348659, "loss_full_dim": 0.31646427512168884, "loss_main": 0.6490572690963745, "loss_parscale": 0.6484375, "loss_sub_dim": 0.33259299397468567, "loss_vclub": 0.000888824462890625, "parscale_sim": 0.98828125, "step": 895 }, { "epoch": 0.8582375478927203, "grad_norm": 7.448790073394775, "learning_rate": 2.905263157894737e-06, "loss": 0.6491, "step": 896 }, { "epoch": 0.8582375478927203, "loss_full_dim": 0.38033461570739746, "loss_main": 0.7771755456924438, "loss_parscale": 0.7890625, "loss_sub_dim": 0.3968409299850464, "loss_vclub": 0.000659942626953125, "parscale_sim": 0.984375, "step": 896 }, { "epoch": 0.8591954022988506, "grad_norm": 14.46817684173584, "learning_rate": 2.9026315789473686e-06, "loss": 0.7772, "step": 897 }, { "epoch": 0.8591954022988506, "loss_full_dim": 0.34550562500953674, "loss_main": 0.706440806388855, "loss_parscale": 0.70703125, "loss_sub_dim": 0.3609352111816406, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.98828125, "step": 897 }, { "epoch": 0.8601532567049809, "grad_norm": 22.756938934326172, "learning_rate": 2.9e-06, "loss": 0.7064, "step": 898 }, { "epoch": 0.8601532567049809, "loss_full_dim": 0.3702312707901001, "loss_main": 0.7560946941375732, "loss_parscale": 0.74609375, "loss_sub_dim": 0.38586342334747314, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98828125, "step": 898 }, { "epoch": 0.8611111111111112, "grad_norm": 8.624464988708496, "learning_rate": 2.897368421052632e-06, "loss": 0.7561, "step": 899 }, { "epoch": 0.8611111111111112, "loss_full_dim": 0.4103418290615082, "loss_main": 0.8381651043891907, "loss_parscale": 0.8359375, "loss_sub_dim": 0.4278232753276825, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 899 }, { "epoch": 0.8620689655172413, "grad_norm": 9.787681579589844, "learning_rate": 2.8947368421052634e-06, "loss": 0.8382, "step": 900 }, { "epoch": 0.8620689655172413, "loss_full_dim": 0.33820798993110657, "loss_main": 0.6918973922729492, "loss_parscale": 0.69921875, "loss_sub_dim": 0.35368940234184265, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.984375, "step": 900 }, { "epoch": 0.8630268199233716, "grad_norm": 8.384641647338867, "learning_rate": 2.892105263157895e-06, "loss": 0.6919, "step": 901 }, { "epoch": 0.8630268199233716, "loss_full_dim": 0.3399753272533417, "loss_main": 0.6968290209770203, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3568536937236786, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.98828125, "step": 901 }, { "epoch": 0.8639846743295019, "grad_norm": 6.394413948059082, "learning_rate": 2.8894736842105265e-06, "loss": 0.6968, "step": 902 }, { "epoch": 0.8639846743295019, "loss_full_dim": 0.3329375386238098, "loss_main": 0.682051420211792, "loss_parscale": 0.6875, "loss_sub_dim": 0.3491138815879822, "loss_vclub": 0.0005645751953125, "parscale_sim": 0.984375, "step": 902 }, { "epoch": 0.8649425287356322, "grad_norm": 7.206964015960693, "learning_rate": 2.886842105263158e-06, "loss": 0.6821, "step": 903 }, { "epoch": 0.8649425287356322, "loss_full_dim": 0.36833426356315613, "loss_main": 0.7514773607254028, "loss_parscale": 0.75390625, "loss_sub_dim": 0.3831430971622467, "loss_vclub": 0.000743865966796875, "parscale_sim": 0.98046875, "step": 903 }, { "epoch": 0.8659003831417624, "grad_norm": 10.813606262207031, "learning_rate": 2.88421052631579e-06, "loss": 0.7515, "step": 904 }, { "epoch": 0.8659003831417624, "loss_full_dim": 0.3640688955783844, "loss_main": 0.7471550703048706, "loss_parscale": 0.7421875, "loss_sub_dim": 0.3830861449241638, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 904 }, { "epoch": 0.8668582375478927, "grad_norm": 6.207857608795166, "learning_rate": 2.8815789473684213e-06, "loss": 0.7472, "step": 905 }, { "epoch": 0.8668582375478927, "loss_full_dim": 0.34123727679252625, "loss_main": 0.699095606803894, "loss_parscale": 0.6953125, "loss_sub_dim": 0.3578583002090454, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 905 }, { "epoch": 0.867816091954023, "grad_norm": 139.3338623046875, "learning_rate": 2.878947368421053e-06, "loss": 0.6991, "step": 906 }, { "epoch": 0.867816091954023, "loss_full_dim": 0.3448452055454254, "loss_main": 0.7057451009750366, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3608998656272888, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98828125, "step": 906 }, { "epoch": 0.8687739463601533, "grad_norm": 7.8703718185424805, "learning_rate": 2.8763157894736844e-06, "loss": 0.7057, "step": 907 }, { "epoch": 0.8687739463601533, "loss_full_dim": 0.3328796625137329, "loss_main": 0.6810639500617981, "loss_parscale": 0.68359375, "loss_sub_dim": 0.3481842875480652, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.9609375, "step": 907 }, { "epoch": 0.8697318007662835, "grad_norm": 7.154751300811768, "learning_rate": 2.8736842105263164e-06, "loss": 0.6811, "step": 908 }, { "epoch": 0.8697318007662835, "loss_full_dim": 0.342176616191864, "loss_main": 0.700751781463623, "loss_parscale": 0.69921875, "loss_sub_dim": 0.35857516527175903, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98046875, "step": 908 }, { "epoch": 0.8706896551724138, "grad_norm": 149.76461791992188, "learning_rate": 2.8710526315789476e-06, "loss": 0.7008, "step": 909 }, { "epoch": 0.8706896551724138, "loss_full_dim": 0.3273458480834961, "loss_main": 0.6709938645362854, "loss_parscale": 0.65625, "loss_sub_dim": 0.3436480164527893, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.98046875, "step": 909 }, { "epoch": 0.8716475095785441, "grad_norm": 19.65696144104004, "learning_rate": 2.868421052631579e-06, "loss": 0.671, "step": 910 }, { "epoch": 0.8716475095785441, "loss_full_dim": 0.3325536549091339, "loss_main": 0.6814312934875488, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3488776683807373, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.984375, "step": 910 }, { "epoch": 0.8726053639846744, "grad_norm": 7.84154748916626, "learning_rate": 2.8657894736842108e-06, "loss": 0.6814, "step": 911 }, { "epoch": 0.8726053639846744, "loss_full_dim": 0.3134353458881378, "loss_main": 0.6426643133163452, "loss_parscale": 0.64453125, "loss_sub_dim": 0.3292289674282074, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.98828125, "step": 911 }, { "epoch": 0.8735632183908046, "grad_norm": 8.065502166748047, "learning_rate": 2.8631578947368423e-06, "loss": 0.6427, "step": 912 }, { "epoch": 0.8735632183908046, "loss_full_dim": 0.350096732378006, "loss_main": 0.7158747911453247, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3657780885696411, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.98046875, "step": 912 }, { "epoch": 0.8745210727969349, "grad_norm": 9.904011726379395, "learning_rate": 2.8605263157894743e-06, "loss": 0.7159, "step": 913 }, { "epoch": 0.8745210727969349, "loss_full_dim": 0.30328473448753357, "loss_main": 0.6199547052383423, "loss_parscale": 0.62109375, "loss_sub_dim": 0.31666994094848633, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.984375, "step": 913 }, { "epoch": 0.8754789272030651, "grad_norm": 5.325815677642822, "learning_rate": 2.8578947368421055e-06, "loss": 0.62, "step": 914 }, { "epoch": 0.8754789272030651, "loss_full_dim": 0.3561640679836273, "loss_main": 0.7275159358978271, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3713518977165222, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 914 }, { "epoch": 0.8764367816091954, "grad_norm": 8.390939712524414, "learning_rate": 2.855263157894737e-06, "loss": 0.7275, "step": 915 }, { "epoch": 0.8764367816091954, "loss_full_dim": 0.36112144589424133, "loss_main": 0.7364975214004517, "loss_parscale": 0.734375, "loss_sub_dim": 0.3753761053085327, "loss_vclub": 0.000701904296875, "parscale_sim": 0.984375, "step": 915 }, { "epoch": 0.8773946360153256, "grad_norm": 8.913397789001465, "learning_rate": 2.8526315789473687e-06, "loss": 0.7365, "step": 916 }, { "epoch": 0.8773946360153256, "loss_full_dim": 0.3700898587703705, "loss_main": 0.7566033601760864, "loss_parscale": 0.75, "loss_sub_dim": 0.38651353120803833, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.984375, "step": 916 }, { "epoch": 0.8783524904214559, "grad_norm": 8.229002952575684, "learning_rate": 2.85e-06, "loss": 0.7566, "step": 917 }, { "epoch": 0.8783524904214559, "loss_full_dim": 0.32592377066612244, "loss_main": 0.6679903268814087, "loss_parscale": 0.671875, "loss_sub_dim": 0.34206652641296387, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.96484375, "step": 917 }, { "epoch": 0.8793103448275862, "grad_norm": 6.871753692626953, "learning_rate": 2.847368421052632e-06, "loss": 0.668, "step": 918 }, { "epoch": 0.8793103448275862, "loss_full_dim": 0.33008769154548645, "loss_main": 0.6765271425247192, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3464394807815552, "loss_vclub": 0.0009002685546875, "parscale_sim": 0.98828125, "step": 918 }, { "epoch": 0.8802681992337165, "grad_norm": 6.808361053466797, "learning_rate": 2.8447368421052634e-06, "loss": 0.6765, "step": 919 }, { "epoch": 0.8802681992337165, "loss_full_dim": 0.3296225965023041, "loss_main": 0.6753994822502136, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34577688574790955, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 919 }, { "epoch": 0.8812260536398467, "grad_norm": 7.643487453460693, "learning_rate": 2.842105263157895e-06, "loss": 0.6754, "step": 920 }, { "epoch": 0.8812260536398467, "loss_full_dim": 0.3656436502933502, "loss_main": 0.7471087574958801, "loss_parscale": 0.74609375, "loss_sub_dim": 0.3814651072025299, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.984375, "step": 920 }, { "epoch": 0.882183908045977, "grad_norm": 4.205369472503662, "learning_rate": 2.8394736842105266e-06, "loss": 0.7471, "step": 921 }, { "epoch": 0.882183908045977, "loss_full_dim": 0.33784914016723633, "loss_main": 0.6923626661300659, "loss_parscale": 0.703125, "loss_sub_dim": 0.3545135259628296, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.984375, "step": 921 }, { "epoch": 0.8831417624521073, "grad_norm": 10.529537200927734, "learning_rate": 2.8368421052631586e-06, "loss": 0.6924, "step": 922 }, { "epoch": 0.8831417624521073, "loss_full_dim": 0.35109227895736694, "loss_main": 0.7151709198951721, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3640786409378052, "loss_vclub": 0.00058746337890625, "parscale_sim": 0.984375, "step": 922 }, { "epoch": 0.8840996168582376, "grad_norm": 5.127645492553711, "learning_rate": 2.8342105263157897e-06, "loss": 0.7152, "step": 923 }, { "epoch": 0.8840996168582376, "loss_full_dim": 0.3586982190608978, "loss_main": 0.736346960067749, "loss_parscale": 0.74609375, "loss_sub_dim": 0.3776487112045288, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98828125, "step": 923 }, { "epoch": 0.8850574712643678, "grad_norm": 8.64691162109375, "learning_rate": 2.8315789473684213e-06, "loss": 0.7363, "step": 924 }, { "epoch": 0.8850574712643678, "loss_full_dim": 0.32164353132247925, "loss_main": 0.6579959392547607, "loss_parscale": 0.65625, "loss_sub_dim": 0.3363524377346039, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 924 }, { "epoch": 0.8860153256704981, "grad_norm": 9.519312858581543, "learning_rate": 2.828947368421053e-06, "loss": 0.658, "step": 925 }, { "epoch": 0.8860153256704981, "loss_full_dim": 0.3440316915512085, "loss_main": 0.702698826789856, "loss_parscale": 0.7109375, "loss_sub_dim": 0.35866713523864746, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 925 }, { "epoch": 0.8869731800766284, "grad_norm": 8.511509895324707, "learning_rate": 2.826315789473684e-06, "loss": 0.7027, "step": 926 }, { "epoch": 0.8869731800766284, "loss_full_dim": 0.2913690507411957, "loss_main": 0.5950907468795776, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30372169613838196, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.984375, "step": 926 }, { "epoch": 0.8879310344827587, "grad_norm": 5.671322822570801, "learning_rate": 2.823684210526316e-06, "loss": 0.5951, "step": 927 }, { "epoch": 0.8879310344827587, "loss_full_dim": 0.35852062702178955, "loss_main": 0.7332503199577332, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3747296929359436, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.96484375, "step": 927 }, { "epoch": 0.8888888888888888, "grad_norm": 7.037281036376953, "learning_rate": 2.8210526315789476e-06, "loss": 0.7333, "step": 928 }, { "epoch": 0.8888888888888888, "loss_full_dim": 0.370576947927475, "loss_main": 0.7583469152450562, "loss_parscale": 0.765625, "loss_sub_dim": 0.3877699375152588, "loss_vclub": 0.000621795654296875, "parscale_sim": 0.98828125, "step": 928 }, { "epoch": 0.8898467432950191, "grad_norm": 8.955153465270996, "learning_rate": 2.8184210526315792e-06, "loss": 0.7583, "step": 929 }, { "epoch": 0.8898467432950191, "loss_full_dim": 0.33068162202835083, "loss_main": 0.6769073009490967, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34622567892074585, "loss_vclub": 0.000652313232421875, "parscale_sim": 0.984375, "step": 929 }, { "epoch": 0.8908045977011494, "grad_norm": 14.687442779541016, "learning_rate": 2.815789473684211e-06, "loss": 0.6769, "step": 930 }, { "epoch": 0.8908045977011494, "loss_full_dim": 0.3513534665107727, "loss_main": 0.718526303768158, "loss_parscale": 0.72265625, "loss_sub_dim": 0.36717283725738525, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98828125, "step": 930 }, { "epoch": 0.8917624521072797, "grad_norm": 7.761190891265869, "learning_rate": 2.813157894736842e-06, "loss": 0.7185, "step": 931 }, { "epoch": 0.8917624521072797, "loss_full_dim": 0.3093845546245575, "loss_main": 0.6338789463043213, "loss_parscale": 0.640625, "loss_sub_dim": 0.3244943618774414, "loss_vclub": 0.000591278076171875, "parscale_sim": 0.98828125, "step": 931 }, { "epoch": 0.89272030651341, "grad_norm": 8.159764289855957, "learning_rate": 2.810526315789474e-06, "loss": 0.6339, "step": 932 }, { "epoch": 0.89272030651341, "loss_full_dim": 0.343359112739563, "loss_main": 0.7009860277175903, "loss_parscale": 0.6953125, "loss_sub_dim": 0.35762691497802734, "loss_vclub": 0.000743865966796875, "parscale_sim": 0.984375, "step": 932 }, { "epoch": 0.8936781609195402, "grad_norm": 7.107862949371338, "learning_rate": 2.8078947368421056e-06, "loss": 0.701, "step": 933 }, { "epoch": 0.8936781609195402, "loss_full_dim": 0.28799790143966675, "loss_main": 0.5890089273452759, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30101099610328674, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98046875, "step": 933 }, { "epoch": 0.8946360153256705, "grad_norm": 7.920376777648926, "learning_rate": 2.805263157894737e-06, "loss": 0.589, "step": 934 }, { "epoch": 0.8946360153256705, "loss_full_dim": 0.2697123885154724, "loss_main": 0.5536733269691467, "loss_parscale": 0.55078125, "loss_sub_dim": 0.2839609384536743, "loss_vclub": 0.000598907470703125, "parscale_sim": 0.984375, "step": 934 }, { "epoch": 0.8955938697318008, "grad_norm": 6.622039318084717, "learning_rate": 2.8026315789473683e-06, "loss": 0.5537, "step": 935 }, { "epoch": 0.8955938697318008, "loss_full_dim": 0.3712245523929596, "loss_main": 0.7603943347930908, "loss_parscale": 0.76171875, "loss_sub_dim": 0.3891698122024536, "loss_vclub": 0.000560760498046875, "parscale_sim": 0.9765625, "step": 935 }, { "epoch": 0.896551724137931, "grad_norm": 7.583546161651611, "learning_rate": 2.8000000000000003e-06, "loss": 0.7604, "step": 936 }, { "epoch": 0.896551724137931, "loss_full_dim": 0.35297995805740356, "loss_main": 0.7195560932159424, "loss_parscale": 0.71875, "loss_sub_dim": 0.3665761649608612, "loss_vclub": 0.00055694580078125, "parscale_sim": 0.98828125, "step": 936 }, { "epoch": 0.8975095785440613, "grad_norm": 15.52218246459961, "learning_rate": 2.797368421052632e-06, "loss": 0.7196, "step": 937 }, { "epoch": 0.8975095785440613, "loss_full_dim": 0.36785781383514404, "loss_main": 0.7521650791168213, "loss_parscale": 0.7421875, "loss_sub_dim": 0.38430726528167725, "loss_vclub": 0.000579833984375, "parscale_sim": 0.98828125, "step": 937 }, { "epoch": 0.8984674329501916, "grad_norm": 7.4116530418396, "learning_rate": 2.7947368421052635e-06, "loss": 0.7522, "step": 938 }, { "epoch": 0.8984674329501916, "loss_full_dim": 0.27627870440483093, "loss_main": 0.5660357475280762, "loss_parscale": 0.5703125, "loss_sub_dim": 0.28975701332092285, "loss_vclub": 0.00058746337890625, "parscale_sim": 0.984375, "step": 938 }, { "epoch": 0.8994252873563219, "grad_norm": 38.79964828491211, "learning_rate": 2.792105263157895e-06, "loss": 0.566, "step": 939 }, { "epoch": 0.8994252873563219, "loss_full_dim": 0.40671294927597046, "loss_main": 0.8300405144691467, "loss_parscale": 0.8359375, "loss_sub_dim": 0.42332756519317627, "loss_vclub": 0.000701904296875, "parscale_sim": 0.98828125, "step": 939 }, { "epoch": 0.9003831417624522, "grad_norm": 11.037788391113281, "learning_rate": 2.789473684210526e-06, "loss": 0.83, "step": 940 }, { "epoch": 0.9003831417624522, "loss_full_dim": 0.34082627296447754, "loss_main": 0.6978436708450317, "loss_parscale": 0.6953125, "loss_sub_dim": 0.3570173680782318, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.984375, "step": 940 }, { "epoch": 0.9013409961685823, "grad_norm": 50.05608367919922, "learning_rate": 2.786842105263158e-06, "loss": 0.6978, "step": 941 }, { "epoch": 0.9013409961685823, "loss_full_dim": 0.3414318561553955, "loss_main": 0.6958320736885071, "loss_parscale": 0.6953125, "loss_sub_dim": 0.3544002175331116, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.984375, "step": 941 }, { "epoch": 0.9022988505747126, "grad_norm": 9.6146879196167, "learning_rate": 2.7842105263157898e-06, "loss": 0.6958, "step": 942 }, { "epoch": 0.9022988505747126, "loss_full_dim": 0.3920171856880188, "loss_main": 0.8017415404319763, "loss_parscale": 0.8046875, "loss_sub_dim": 0.4097243547439575, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.98046875, "step": 942 }, { "epoch": 0.9032567049808429, "grad_norm": 6.980498313903809, "learning_rate": 2.7815789473684214e-06, "loss": 0.8017, "step": 943 }, { "epoch": 0.9032567049808429, "loss_full_dim": 0.3206935226917267, "loss_main": 0.6591084003448486, "loss_parscale": 0.66796875, "loss_sub_dim": 0.33841484785079956, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.98828125, "step": 943 }, { "epoch": 0.9042145593869731, "grad_norm": 7.432158946990967, "learning_rate": 2.7789473684210525e-06, "loss": 0.6591, "step": 944 }, { "epoch": 0.9042145593869731, "loss_full_dim": 0.3230404257774353, "loss_main": 0.6619117856025696, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3388713598251343, "loss_vclub": 0.00067138671875, "parscale_sim": 0.9765625, "step": 944 }, { "epoch": 0.9051724137931034, "grad_norm": 12.421504974365234, "learning_rate": 2.776315789473684e-06, "loss": 0.6619, "step": 945 }, { "epoch": 0.9051724137931034, "loss_full_dim": 0.2801661193370819, "loss_main": 0.5750322937965393, "loss_parscale": 0.57421875, "loss_sub_dim": 0.2948661744594574, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98828125, "step": 945 }, { "epoch": 0.9061302681992337, "grad_norm": 5.187319278717041, "learning_rate": 2.773684210526316e-06, "loss": 0.575, "step": 946 }, { "epoch": 0.9061302681992337, "loss_full_dim": 0.44359129667282104, "loss_main": 0.9051036238670349, "loss_parscale": 0.90625, "loss_sub_dim": 0.46151232719421387, "loss_vclub": 0.00079345703125, "parscale_sim": 0.9765625, "step": 946 }, { "epoch": 0.907088122605364, "grad_norm": 9.611565589904785, "learning_rate": 2.7710526315789477e-06, "loss": 0.9051, "step": 947 }, { "epoch": 0.907088122605364, "loss_full_dim": 0.3805622160434723, "loss_main": 0.7792695760726929, "loss_parscale": 0.7734375, "loss_sub_dim": 0.3987073302268982, "loss_vclub": 0.000553131103515625, "parscale_sim": 0.97265625, "step": 947 }, { "epoch": 0.9080459770114943, "grad_norm": 11.460492134094238, "learning_rate": 2.7684210526315793e-06, "loss": 0.7793, "step": 948 }, { "epoch": 0.9080459770114943, "loss_full_dim": 0.40089523792266846, "loss_main": 0.8200491070747375, "loss_parscale": 0.80859375, "loss_sub_dim": 0.4191538691520691, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.984375, "step": 948 }, { "epoch": 0.9090038314176245, "grad_norm": 7.064073085784912, "learning_rate": 2.7657894736842104e-06, "loss": 0.82, "step": 949 }, { "epoch": 0.9090038314176245, "loss_full_dim": 0.36152705550193787, "loss_main": 0.741690993309021, "loss_parscale": 0.7421875, "loss_sub_dim": 0.38016390800476074, "loss_vclub": 0.000873565673828125, "parscale_sim": 0.984375, "step": 949 }, { "epoch": 0.9099616858237548, "grad_norm": 8.650694847106934, "learning_rate": 2.7631578947368424e-06, "loss": 0.7417, "step": 950 }, { "epoch": 0.9099616858237548, "loss_full_dim": 0.40121641755104065, "loss_main": 0.8226373195648193, "loss_parscale": 0.828125, "loss_sub_dim": 0.4214209318161011, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98828125, "step": 950 }, { "epoch": 0.9109195402298851, "grad_norm": 74.95230865478516, "learning_rate": 2.760526315789474e-06, "loss": 0.8226, "step": 951 }, { "epoch": 0.9109195402298851, "loss_full_dim": 0.34725406765937805, "loss_main": 0.7112765312194824, "loss_parscale": 0.71875, "loss_sub_dim": 0.364022433757782, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 951 }, { "epoch": 0.9118773946360154, "grad_norm": 9.418596267700195, "learning_rate": 2.7578947368421056e-06, "loss": 0.7113, "step": 952 }, { "epoch": 0.9118773946360154, "loss_full_dim": 0.27905139327049255, "loss_main": 0.5725299119949341, "loss_parscale": 0.578125, "loss_sub_dim": 0.29347848892211914, "loss_vclub": 0.000743865966796875, "parscale_sim": 0.98828125, "step": 952 }, { "epoch": 0.9128352490421456, "grad_norm": 8.08649730682373, "learning_rate": 2.7552631578947368e-06, "loss": 0.5725, "step": 953 }, { "epoch": 0.9128352490421456, "loss_full_dim": 0.3743758201599121, "loss_main": 0.7651118040084839, "loss_parscale": 0.7578125, "loss_sub_dim": 0.3907359838485718, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.98828125, "step": 953 }, { "epoch": 0.9137931034482759, "grad_norm": 6.540586471557617, "learning_rate": 2.7526315789473683e-06, "loss": 0.7651, "step": 954 }, { "epoch": 0.9137931034482759, "loss_full_dim": 0.32465630769729614, "loss_main": 0.6691572070121765, "loss_parscale": 0.68359375, "loss_sub_dim": 0.34450089931488037, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 954 }, { "epoch": 0.9147509578544061, "grad_norm": 15.078311920166016, "learning_rate": 2.7500000000000004e-06, "loss": 0.6692, "step": 955 }, { "epoch": 0.9147509578544061, "loss_full_dim": 0.3151005804538727, "loss_main": 0.6449224948883057, "loss_parscale": 0.65234375, "loss_sub_dim": 0.329821914434433, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98828125, "step": 955 }, { "epoch": 0.9157088122605364, "grad_norm": 7.67079496383667, "learning_rate": 2.747368421052632e-06, "loss": 0.6449, "step": 956 }, { "epoch": 0.9157088122605364, "loss_full_dim": 0.2725914716720581, "loss_main": 0.5581051111221313, "loss_parscale": 0.55859375, "loss_sub_dim": 0.28551363945007324, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 956 }, { "epoch": 0.9166666666666666, "grad_norm": 8.666061401367188, "learning_rate": 2.7447368421052635e-06, "loss": 0.5581, "step": 957 }, { "epoch": 0.9166666666666666, "loss_full_dim": 0.4016520380973816, "loss_main": 0.8215457797050476, "loss_parscale": 0.8203125, "loss_sub_dim": 0.419893741607666, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98046875, "step": 957 }, { "epoch": 0.9176245210727969, "grad_norm": 5.573220729827881, "learning_rate": 2.7421052631578947e-06, "loss": 0.8215, "step": 958 }, { "epoch": 0.9176245210727969, "loss_full_dim": 0.334060400724411, "loss_main": 0.6830474734306335, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34898707270622253, "loss_vclub": 0.000629425048828125, "parscale_sim": 0.9609375, "step": 958 }, { "epoch": 0.9185823754789272, "grad_norm": 11.58786392211914, "learning_rate": 2.7394736842105263e-06, "loss": 0.683, "step": 959 }, { "epoch": 0.9185823754789272, "loss_full_dim": 0.3226364850997925, "loss_main": 0.6614015698432922, "loss_parscale": 0.67578125, "loss_sub_dim": 0.33876508474349976, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.98046875, "step": 959 }, { "epoch": 0.9195402298850575, "grad_norm": 8.430212020874023, "learning_rate": 2.7368421052631583e-06, "loss": 0.6614, "step": 960 }, { "epoch": 0.9195402298850575, "loss_full_dim": 0.31322577595710754, "loss_main": 0.6407754421234131, "loss_parscale": 0.6484375, "loss_sub_dim": 0.32754963636398315, "loss_vclub": 0.000850677490234375, "parscale_sim": 0.984375, "step": 960 }, { "epoch": 0.9204980842911877, "grad_norm": 8.175201416015625, "learning_rate": 2.73421052631579e-06, "loss": 0.6408, "step": 961 }, { "epoch": 0.9204980842911877, "loss_full_dim": 0.3384082019329071, "loss_main": 0.693867564201355, "loss_parscale": 0.6875, "loss_sub_dim": 0.3554593324661255, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 961 }, { "epoch": 0.921455938697318, "grad_norm": 8.879694938659668, "learning_rate": 2.7315789473684214e-06, "loss": 0.6939, "step": 962 }, { "epoch": 0.921455938697318, "loss_full_dim": 0.4093545079231262, "loss_main": 0.8360594511032104, "loss_parscale": 0.83984375, "loss_sub_dim": 0.4267049729824066, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.984375, "step": 962 }, { "epoch": 0.9224137931034483, "grad_norm": 9.22118854522705, "learning_rate": 2.7289473684210526e-06, "loss": 0.8361, "step": 963 }, { "epoch": 0.9224137931034483, "loss_full_dim": 0.37299826741218567, "loss_main": 0.7634646892547607, "loss_parscale": 0.76953125, "loss_sub_dim": 0.3904663920402527, "loss_vclub": 0.000888824462890625, "parscale_sim": 0.984375, "step": 963 }, { "epoch": 0.9233716475095786, "grad_norm": 7.180814743041992, "learning_rate": 2.7263157894736846e-06, "loss": 0.7635, "step": 964 }, { "epoch": 0.9233716475095786, "loss_full_dim": 0.32852354645729065, "loss_main": 0.6731805801391602, "loss_parscale": 0.66796875, "loss_sub_dim": 0.3446570038795471, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98046875, "step": 964 }, { "epoch": 0.9243295019157088, "grad_norm": 8.86963176727295, "learning_rate": 2.723684210526316e-06, "loss": 0.6732, "step": 965 }, { "epoch": 0.9243295019157088, "loss_full_dim": 0.33910080790519714, "loss_main": 0.6948814392089844, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3557806611061096, "loss_vclub": 0.000652313232421875, "parscale_sim": 0.984375, "step": 965 }, { "epoch": 0.9252873563218391, "grad_norm": 9.05751895904541, "learning_rate": 2.7210526315789478e-06, "loss": 0.6949, "step": 966 }, { "epoch": 0.9252873563218391, "loss_full_dim": 0.39381614327430725, "loss_main": 0.8038371801376343, "loss_parscale": 0.8046875, "loss_sub_dim": 0.41002100706100464, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.95703125, "step": 966 }, { "epoch": 0.9262452107279694, "grad_norm": 15.227457046508789, "learning_rate": 2.718421052631579e-06, "loss": 0.8038, "step": 967 }, { "epoch": 0.9262452107279694, "loss_full_dim": 0.35743728280067444, "loss_main": 0.7346208095550537, "loss_parscale": 0.7421875, "loss_sub_dim": 0.37718355655670166, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 967 }, { "epoch": 0.9272030651340997, "grad_norm": 11.193381309509277, "learning_rate": 2.7157894736842105e-06, "loss": 0.7346, "step": 968 }, { "epoch": 0.9272030651340997, "loss_full_dim": 0.33252963423728943, "loss_main": 0.680465817451477, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34793615341186523, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98046875, "step": 968 }, { "epoch": 0.9281609195402298, "grad_norm": 8.302539825439453, "learning_rate": 2.7131578947368425e-06, "loss": 0.6805, "step": 969 }, { "epoch": 0.9281609195402298, "loss_full_dim": 0.3011888265609741, "loss_main": 0.6182879209518433, "loss_parscale": 0.625, "loss_sub_dim": 0.31709906458854675, "loss_vclub": 0.000732421875, "parscale_sim": 0.98828125, "step": 969 }, { "epoch": 0.9291187739463601, "grad_norm": 8.371973991394043, "learning_rate": 2.710526315789474e-06, "loss": 0.6183, "step": 970 }, { "epoch": 0.9291187739463601, "loss_full_dim": 0.34607091546058655, "loss_main": 0.7073670625686646, "loss_parscale": 0.703125, "loss_sub_dim": 0.3612961173057556, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98046875, "step": 970 }, { "epoch": 0.9300766283524904, "grad_norm": 14.741491317749023, "learning_rate": 2.7078947368421057e-06, "loss": 0.7074, "step": 971 }, { "epoch": 0.9300766283524904, "loss_full_dim": 0.3363267779350281, "loss_main": 0.688217282295227, "loss_parscale": 0.6875, "loss_sub_dim": 0.351890504360199, "loss_vclub": 0.000774383544921875, "parscale_sim": 0.98828125, "step": 971 }, { "epoch": 0.9310344827586207, "grad_norm": 8.901603698730469, "learning_rate": 2.705263157894737e-06, "loss": 0.6882, "step": 972 }, { "epoch": 0.9310344827586207, "loss_full_dim": 0.3228759467601776, "loss_main": 0.6630109548568726, "loss_parscale": 0.66796875, "loss_sub_dim": 0.34013497829437256, "loss_vclub": 0.000732421875, "parscale_sim": 0.98828125, "step": 972 }, { "epoch": 0.9319923371647509, "grad_norm": 6.1910786628723145, "learning_rate": 2.7026315789473684e-06, "loss": 0.663, "step": 973 }, { "epoch": 0.9319923371647509, "loss_full_dim": 0.3232079744338989, "loss_main": 0.6614378094673157, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33822983503341675, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.984375, "step": 973 }, { "epoch": 0.9329501915708812, "grad_norm": 7.434993267059326, "learning_rate": 2.7000000000000004e-06, "loss": 0.6614, "step": 974 }, { "epoch": 0.9329501915708812, "loss_full_dim": 0.34001049399375916, "loss_main": 0.6954053640365601, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3553948998451233, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 974 }, { "epoch": 0.9339080459770115, "grad_norm": 4.543356895446777, "learning_rate": 2.697368421052632e-06, "loss": 0.6954, "step": 975 }, { "epoch": 0.9339080459770115, "loss_full_dim": 0.28276965022087097, "loss_main": 0.581802248954773, "loss_parscale": 0.5859375, "loss_sub_dim": 0.299032598733902, "loss_vclub": 0.000690460205078125, "parscale_sim": 0.984375, "step": 975 }, { "epoch": 0.9348659003831418, "grad_norm": 6.242292404174805, "learning_rate": 2.694736842105263e-06, "loss": 0.5818, "step": 976 }, { "epoch": 0.9348659003831418, "loss_full_dim": 0.3246418535709381, "loss_main": 0.6649823784828186, "loss_parscale": 0.671875, "loss_sub_dim": 0.3403405249118805, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 976 }, { "epoch": 0.935823754789272, "grad_norm": 19.38972282409668, "learning_rate": 2.6921052631578947e-06, "loss": 0.665, "step": 977 }, { "epoch": 0.935823754789272, "loss_full_dim": 0.36760184168815613, "loss_main": 0.7491874694824219, "loss_parscale": 0.75, "loss_sub_dim": 0.38158565759658813, "loss_vclub": 0.000743865966796875, "parscale_sim": 0.98046875, "step": 977 }, { "epoch": 0.9367816091954023, "grad_norm": 11.820640563964844, "learning_rate": 2.6894736842105267e-06, "loss": 0.7492, "step": 978 }, { "epoch": 0.9367816091954023, "loss_full_dim": 0.2919006943702698, "loss_main": 0.5982301831245422, "loss_parscale": 0.59765625, "loss_sub_dim": 0.30632948875427246, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.984375, "step": 978 }, { "epoch": 0.9377394636015326, "grad_norm": 8.491400718688965, "learning_rate": 2.6868421052631583e-06, "loss": 0.5982, "step": 979 }, { "epoch": 0.9377394636015326, "loss_full_dim": 0.3084620237350464, "loss_main": 0.6323287487030029, "loss_parscale": 0.625, "loss_sub_dim": 0.32386672496795654, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.984375, "step": 979 }, { "epoch": 0.9386973180076629, "grad_norm": 23.016775131225586, "learning_rate": 2.68421052631579e-06, "loss": 0.6323, "step": 980 }, { "epoch": 0.9386973180076629, "loss_full_dim": 0.3196735978126526, "loss_main": 0.657806932926178, "loss_parscale": 0.671875, "loss_sub_dim": 0.3381333351135254, "loss_vclub": 0.000598907470703125, "parscale_sim": 0.984375, "step": 980 }, { "epoch": 0.9396551724137931, "grad_norm": 4.83700704574585, "learning_rate": 2.681578947368421e-06, "loss": 0.6578, "step": 981 }, { "epoch": 0.9396551724137931, "loss_full_dim": 0.32424765825271606, "loss_main": 0.6638554334640503, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33960777521133423, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.98828125, "step": 981 }, { "epoch": 0.9406130268199234, "grad_norm": 9.451693534851074, "learning_rate": 2.6789473684210526e-06, "loss": 0.6639, "step": 982 }, { "epoch": 0.9406130268199234, "loss_full_dim": 0.35476502776145935, "loss_main": 0.7241904139518738, "loss_parscale": 0.72265625, "loss_sub_dim": 0.36942538619041443, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98046875, "step": 982 }, { "epoch": 0.9415708812260536, "grad_norm": 54.13290786743164, "learning_rate": 2.6763157894736846e-06, "loss": 0.7242, "step": 983 }, { "epoch": 0.9415708812260536, "loss_full_dim": 0.29818037152290344, "loss_main": 0.6075798273086548, "loss_parscale": 0.609375, "loss_sub_dim": 0.30939948558807373, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.984375, "step": 983 }, { "epoch": 0.9425287356321839, "grad_norm": 7.45620059967041, "learning_rate": 2.6736842105263162e-06, "loss": 0.6076, "step": 984 }, { "epoch": 0.9425287356321839, "loss_full_dim": 0.31818485260009766, "loss_main": 0.6546238660812378, "loss_parscale": 0.66015625, "loss_sub_dim": 0.33643898367881775, "loss_vclub": 0.000621795654296875, "parscale_sim": 0.984375, "step": 984 }, { "epoch": 0.9434865900383141, "grad_norm": 5.760212421417236, "learning_rate": 2.6710526315789474e-06, "loss": 0.6546, "step": 985 }, { "epoch": 0.9434865900383141, "loss_full_dim": 0.38443806767463684, "loss_main": 0.7843769788742065, "loss_parscale": 0.7890625, "loss_sub_dim": 0.3999389410018921, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.98828125, "step": 985 }, { "epoch": 0.9444444444444444, "grad_norm": 8.426176071166992, "learning_rate": 2.668421052631579e-06, "loss": 0.7844, "step": 986 }, { "epoch": 0.9444444444444444, "loss_full_dim": 0.3334839940071106, "loss_main": 0.6826735734939575, "loss_parscale": 0.68359375, "loss_sub_dim": 0.34918954968452454, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.98828125, "step": 986 }, { "epoch": 0.9454022988505747, "grad_norm": 6.9639177322387695, "learning_rate": 2.6657894736842105e-06, "loss": 0.6827, "step": 987 }, { "epoch": 0.9454022988505747, "loss_full_dim": 0.3386130928993225, "loss_main": 0.6929627060890198, "loss_parscale": 0.6953125, "loss_sub_dim": 0.35434961318969727, "loss_vclub": 0.000614166259765625, "parscale_sim": 0.984375, "step": 987 }, { "epoch": 0.946360153256705, "grad_norm": 7.601863384246826, "learning_rate": 2.6631578947368426e-06, "loss": 0.693, "step": 988 }, { "epoch": 0.946360153256705, "loss_full_dim": 0.3243293762207031, "loss_main": 0.662812352180481, "loss_parscale": 0.66796875, "loss_sub_dim": 0.33848297595977783, "loss_vclub": 0.000621795654296875, "parscale_sim": 0.984375, "step": 988 }, { "epoch": 0.9473180076628352, "grad_norm": 6.013468265533447, "learning_rate": 2.660526315789474e-06, "loss": 0.6628, "step": 989 }, { "epoch": 0.9473180076628352, "loss_full_dim": 0.3665591776371002, "loss_main": 0.7476669549942017, "loss_parscale": 0.75390625, "loss_sub_dim": 0.38110774755477905, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98828125, "step": 989 }, { "epoch": 0.9482758620689655, "grad_norm": 7.408607482910156, "learning_rate": 2.6578947368421053e-06, "loss": 0.7477, "step": 990 }, { "epoch": 0.9482758620689655, "loss_full_dim": 0.3333336114883423, "loss_main": 0.6825194954872131, "loss_parscale": 0.6875, "loss_sub_dim": 0.34918588399887085, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.9921875, "step": 990 }, { "epoch": 0.9492337164750958, "grad_norm": 7.070592403411865, "learning_rate": 2.655263157894737e-06, "loss": 0.6825, "step": 991 }, { "epoch": 0.9492337164750958, "loss_full_dim": 0.3375544548034668, "loss_main": 0.6907137632369995, "loss_parscale": 0.6953125, "loss_sub_dim": 0.3531592786312103, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.984375, "step": 991 }, { "epoch": 0.9501915708812261, "grad_norm": 9.032967567443848, "learning_rate": 2.652631578947369e-06, "loss": 0.6907, "step": 992 }, { "epoch": 0.9501915708812261, "loss_full_dim": 0.3293716609477997, "loss_main": 0.6749327182769775, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34556102752685547, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.9921875, "step": 992 }, { "epoch": 0.9511494252873564, "grad_norm": 12.110572814941406, "learning_rate": 2.6500000000000005e-06, "loss": 0.6749, "step": 993 }, { "epoch": 0.9511494252873564, "loss_full_dim": 0.3572593033313751, "loss_main": 0.7287373542785645, "loss_parscale": 0.734375, "loss_sub_dim": 0.37147802114486694, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.984375, "step": 993 }, { "epoch": 0.9521072796934866, "grad_norm": 7.7538981437683105, "learning_rate": 2.6473684210526316e-06, "loss": 0.7287, "step": 994 }, { "epoch": 0.9521072796934866, "loss_full_dim": 0.3202475309371948, "loss_main": 0.656971275806427, "loss_parscale": 0.65625, "loss_sub_dim": 0.3367237448692322, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.984375, "step": 994 }, { "epoch": 0.9530651340996169, "grad_norm": 8.05822467803955, "learning_rate": 2.644736842105263e-06, "loss": 0.657, "step": 995 }, { "epoch": 0.9530651340996169, "loss_full_dim": 0.32426372170448303, "loss_main": 0.6636141538619995, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3393504023551941, "loss_vclub": 0.000637054443359375, "parscale_sim": 0.984375, "step": 995 }, { "epoch": 0.9540229885057471, "grad_norm": 7.138598918914795, "learning_rate": 2.6421052631578948e-06, "loss": 0.6636, "step": 996 }, { "epoch": 0.9540229885057471, "loss_full_dim": 0.35446399450302124, "loss_main": 0.727826714515686, "loss_parscale": 0.72265625, "loss_sub_dim": 0.3733627200126648, "loss_vclub": 0.00091552734375, "parscale_sim": 0.98828125, "step": 996 }, { "epoch": 0.9549808429118773, "grad_norm": 6.907897472381592, "learning_rate": 2.639473684210527e-06, "loss": 0.7278, "step": 997 }, { "epoch": 0.9549808429118773, "loss_full_dim": 0.38206326961517334, "loss_main": 0.7799621820449829, "loss_parscale": 0.78125, "loss_sub_dim": 0.39789891242980957, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98828125, "step": 997 }, { "epoch": 0.9559386973180076, "grad_norm": 15.352213859558105, "learning_rate": 2.6368421052631584e-06, "loss": 0.78, "step": 998 }, { "epoch": 0.9559386973180076, "loss_full_dim": 0.386430948972702, "loss_main": 0.7937735319137573, "loss_parscale": 0.796875, "loss_sub_dim": 0.4073426127433777, "loss_vclub": 0.00054931640625, "parscale_sim": 0.984375, "step": 998 }, { "epoch": 0.9568965517241379, "grad_norm": 42.56093215942383, "learning_rate": 2.6342105263157895e-06, "loss": 0.7938, "step": 999 }, { "epoch": 0.9568965517241379, "loss_full_dim": 0.29308241605758667, "loss_main": 0.6000210046768188, "loss_parscale": 0.59375, "loss_sub_dim": 0.30693861842155457, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 999 }, { "epoch": 0.9578544061302682, "grad_norm": 12.927788734436035, "learning_rate": 2.631578947368421e-06, "loss": 0.6, "step": 1000 }, { "epoch": 0.9578544061302682, "loss_full_dim": 0.3740207552909851, "loss_main": 0.7649590969085693, "loss_parscale": 0.7734375, "loss_sub_dim": 0.39093834161758423, "loss_vclub": 0.000850677490234375, "parscale_sim": 0.984375, "step": 1000 }, { "epoch": 0.9588122605363985, "grad_norm": 7.863142490386963, "learning_rate": 2.6289473684210527e-06, "loss": 0.765, "step": 1001 }, { "epoch": 0.9588122605363985, "loss_full_dim": 0.25263652205467224, "loss_main": 0.5193809270858765, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26674437522888184, "loss_vclub": 0.000762939453125, "parscale_sim": 0.984375, "step": 1001 }, { "epoch": 0.9597701149425287, "grad_norm": 6.340612888336182, "learning_rate": 2.6263157894736847e-06, "loss": 0.5194, "step": 1002 }, { "epoch": 0.9597701149425287, "loss_full_dim": 0.34443584084510803, "loss_main": 0.7055114507675171, "loss_parscale": 0.70703125, "loss_sub_dim": 0.36107563972473145, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.984375, "step": 1002 }, { "epoch": 0.960727969348659, "grad_norm": 8.460693359375, "learning_rate": 2.623684210526316e-06, "loss": 0.7055, "step": 1003 }, { "epoch": 0.960727969348659, "loss_full_dim": 0.2769145965576172, "loss_main": 0.5683712959289551, "loss_parscale": 0.578125, "loss_sub_dim": 0.2914566993713379, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.984375, "step": 1003 }, { "epoch": 0.9616858237547893, "grad_norm": 8.606009483337402, "learning_rate": 2.6210526315789474e-06, "loss": 0.5684, "step": 1004 }, { "epoch": 0.9616858237547893, "loss_full_dim": 0.3748375177383423, "loss_main": 0.7656341195106506, "loss_parscale": 0.76171875, "loss_sub_dim": 0.39079660177230835, "loss_vclub": 0.000934600830078125, "parscale_sim": 0.98828125, "step": 1004 }, { "epoch": 0.9626436781609196, "grad_norm": 5.558459758758545, "learning_rate": 2.618421052631579e-06, "loss": 0.7656, "step": 1005 }, { "epoch": 0.9626436781609196, "loss_full_dim": 0.3418247699737549, "loss_main": 0.6991864442825317, "loss_parscale": 0.6953125, "loss_sub_dim": 0.35736167430877686, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.984375, "step": 1005 }, { "epoch": 0.9636015325670498, "grad_norm": 9.767403602600098, "learning_rate": 2.615789473684211e-06, "loss": 0.6992, "step": 1006 }, { "epoch": 0.9636015325670498, "loss_full_dim": 0.33708256483078003, "loss_main": 0.6907483339309692, "loss_parscale": 0.6953125, "loss_sub_dim": 0.3536657691001892, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 1006 }, { "epoch": 0.9645593869731801, "grad_norm": 8.17249870300293, "learning_rate": 2.6131578947368426e-06, "loss": 0.6907, "step": 1007 }, { "epoch": 0.9645593869731801, "loss_full_dim": 0.37216129899024963, "loss_main": 0.760851263999939, "loss_parscale": 0.7578125, "loss_sub_dim": 0.38868993520736694, "loss_vclub": 0.000579833984375, "parscale_sim": 0.9765625, "step": 1007 }, { "epoch": 0.9655172413793104, "grad_norm": 8.179460525512695, "learning_rate": 2.6105263157894738e-06, "loss": 0.7609, "step": 1008 }, { "epoch": 0.9655172413793104, "loss_full_dim": 0.35058924555778503, "loss_main": 0.7182965278625488, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3677073121070862, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 1008 }, { "epoch": 0.9664750957854407, "grad_norm": 9.470303535461426, "learning_rate": 2.6078947368421053e-06, "loss": 0.7183, "step": 1009 }, { "epoch": 0.9664750957854407, "loss_full_dim": 0.3110802471637726, "loss_main": 0.6386126279830933, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3275323510169983, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98046875, "step": 1009 }, { "epoch": 0.9674329501915708, "grad_norm": 5.674261569976807, "learning_rate": 2.605263157894737e-06, "loss": 0.6386, "step": 1010 }, { "epoch": 0.9674329501915708, "loss_full_dim": 0.32219505310058594, "loss_main": 0.6579867601394653, "loss_parscale": 0.65625, "loss_sub_dim": 0.3357917070388794, "loss_vclub": 0.000701904296875, "parscale_sim": 0.98046875, "step": 1010 }, { "epoch": 0.9683908045977011, "grad_norm": 10.28763484954834, "learning_rate": 2.602631578947369e-06, "loss": 0.658, "step": 1011 }, { "epoch": 0.9683908045977011, "loss_full_dim": 0.3206019401550293, "loss_main": 0.6583316326141357, "loss_parscale": 0.66015625, "loss_sub_dim": 0.33772969245910645, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.98828125, "step": 1011 }, { "epoch": 0.9693486590038314, "grad_norm": 7.315009117126465, "learning_rate": 2.6e-06, "loss": 0.6583, "step": 1012 }, { "epoch": 0.9693486590038314, "loss_full_dim": 0.36109673976898193, "loss_main": 0.7388482689857483, "loss_parscale": 0.7421875, "loss_sub_dim": 0.37775152921676636, "loss_vclub": 0.0006103515625, "parscale_sim": 0.984375, "step": 1012 }, { "epoch": 0.9703065134099617, "grad_norm": 7.8263421058654785, "learning_rate": 2.5973684210526317e-06, "loss": 0.7388, "step": 1013 }, { "epoch": 0.9703065134099617, "loss_full_dim": 0.3310362994670868, "loss_main": 0.6769050359725952, "loss_parscale": 0.671875, "loss_sub_dim": 0.3458687663078308, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 1013 }, { "epoch": 0.9712643678160919, "grad_norm": 7.194970607757568, "learning_rate": 2.5947368421052633e-06, "loss": 0.6769, "step": 1014 }, { "epoch": 0.9712643678160919, "loss_full_dim": 0.31934675574302673, "loss_main": 0.654855489730835, "loss_parscale": 0.65625, "loss_sub_dim": 0.3355087637901306, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.984375, "step": 1014 }, { "epoch": 0.9722222222222222, "grad_norm": 4.845890522003174, "learning_rate": 2.592105263157895e-06, "loss": 0.6549, "step": 1015 }, { "epoch": 0.9722222222222222, "loss_full_dim": 0.2881622910499573, "loss_main": 0.5905275940895081, "loss_parscale": 0.58984375, "loss_sub_dim": 0.3023653030395508, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.984375, "step": 1015 }, { "epoch": 0.9731800766283525, "grad_norm": 6.800598621368408, "learning_rate": 2.589473684210527e-06, "loss": 0.5905, "step": 1016 }, { "epoch": 0.9731800766283525, "loss_full_dim": 0.3401682674884796, "loss_main": 0.6969257593154907, "loss_parscale": 0.69921875, "loss_sub_dim": 0.3567575216293335, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.9765625, "step": 1016 }, { "epoch": 0.9741379310344828, "grad_norm": 15.006307601928711, "learning_rate": 2.586842105263158e-06, "loss": 0.6969, "step": 1017 }, { "epoch": 0.9741379310344828, "loss_full_dim": 0.32969245314598083, "loss_main": 0.6768120527267456, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3471195697784424, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.984375, "step": 1017 }, { "epoch": 0.975095785440613, "grad_norm": 6.725327491760254, "learning_rate": 2.5842105263157896e-06, "loss": 0.6768, "step": 1018 }, { "epoch": 0.975095785440613, "loss_full_dim": 0.37321269512176514, "loss_main": 0.761672854423523, "loss_parscale": 0.76171875, "loss_sub_dim": 0.3884601593017578, "loss_vclub": 0.0005035400390625, "parscale_sim": 0.94140625, "step": 1018 }, { "epoch": 0.9760536398467433, "grad_norm": 7.004549026489258, "learning_rate": 2.581578947368421e-06, "loss": 0.7617, "step": 1019 }, { "epoch": 0.9760536398467433, "loss_full_dim": 0.27583742141723633, "loss_main": 0.5662475228309631, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2904101014137268, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98828125, "step": 1019 }, { "epoch": 0.9770114942528736, "grad_norm": 7.728745937347412, "learning_rate": 2.578947368421053e-06, "loss": 0.5662, "step": 1020 }, { "epoch": 0.9770114942528736, "loss_full_dim": 0.35915663838386536, "loss_main": 0.7335207462310791, "loss_parscale": 0.7421875, "loss_sub_dim": 0.37436413764953613, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.9765625, "step": 1020 }, { "epoch": 0.9779693486590039, "grad_norm": 8.699751853942871, "learning_rate": 2.5763157894736848e-06, "loss": 0.7335, "step": 1021 }, { "epoch": 0.9779693486590039, "loss_full_dim": 0.29712387919425964, "loss_main": 0.6102212071418762, "loss_parscale": 0.6015625, "loss_sub_dim": 0.3130973279476166, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.96484375, "step": 1021 }, { "epoch": 0.9789272030651341, "grad_norm": 21.016529083251953, "learning_rate": 2.573684210526316e-06, "loss": 0.6102, "step": 1022 }, { "epoch": 0.9789272030651341, "loss_full_dim": 0.3358205556869507, "loss_main": 0.686116635799408, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3502960801124573, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.984375, "step": 1022 }, { "epoch": 0.9798850574712644, "grad_norm": 9.111051559448242, "learning_rate": 2.5710526315789475e-06, "loss": 0.6861, "step": 1023 }, { "epoch": 0.9798850574712644, "loss_full_dim": 0.3144826292991638, "loss_main": 0.6426064968109131, "loss_parscale": 0.63671875, "loss_sub_dim": 0.32812386751174927, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98828125, "step": 1023 }, { "epoch": 0.9808429118773946, "grad_norm": 8.319169044494629, "learning_rate": 2.568421052631579e-06, "loss": 0.6426, "step": 1024 }, { "epoch": 0.9808429118773946, "loss_full_dim": 0.3581685721874237, "loss_main": 0.7364161014556885, "loss_parscale": 0.7421875, "loss_sub_dim": 0.37824752926826477, "loss_vclub": 0.00066375732421875, "parscale_sim": 0.98046875, "step": 1024 }, { "epoch": 0.9818007662835249, "grad_norm": 10.637943267822266, "learning_rate": 2.565789473684211e-06, "loss": 0.7364, "step": 1025 }, { "epoch": 0.9818007662835249, "loss_full_dim": 0.30944567918777466, "loss_main": 0.6351810693740845, "loss_parscale": 0.6484375, "loss_sub_dim": 0.3257354199886322, "loss_vclub": 0.000629425048828125, "parscale_sim": 0.98828125, "step": 1025 }, { "epoch": 0.9827586206896551, "grad_norm": 6.258913993835449, "learning_rate": 2.5631578947368422e-06, "loss": 0.6352, "step": 1026 }, { "epoch": 0.9827586206896551, "loss_full_dim": 0.3508647680282593, "loss_main": 0.7168915271759033, "loss_parscale": 0.71484375, "loss_sub_dim": 0.36602678894996643, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.98828125, "step": 1026 }, { "epoch": 0.9837164750957854, "grad_norm": 10.544301986694336, "learning_rate": 2.560526315789474e-06, "loss": 0.7169, "step": 1027 }, { "epoch": 0.9837164750957854, "loss_full_dim": 0.35448262095451355, "loss_main": 0.7219586372375488, "loss_parscale": 0.72265625, "loss_sub_dim": 0.3674759864807129, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 1027 }, { "epoch": 0.9846743295019157, "grad_norm": 8.300171852111816, "learning_rate": 2.5578947368421054e-06, "loss": 0.722, "step": 1028 }, { "epoch": 0.9846743295019157, "loss_full_dim": 0.32753467559814453, "loss_main": 0.671184241771698, "loss_parscale": 0.67578125, "loss_sub_dim": 0.34364956617355347, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.9765625, "step": 1028 }, { "epoch": 0.985632183908046, "grad_norm": 6.589667797088623, "learning_rate": 2.555263157894737e-06, "loss": 0.6712, "step": 1029 }, { "epoch": 0.985632183908046, "loss_full_dim": 0.30752187967300415, "loss_main": 0.6307042837142944, "loss_parscale": 0.63671875, "loss_sub_dim": 0.3231824040412903, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.984375, "step": 1029 }, { "epoch": 0.9865900383141762, "grad_norm": 8.620007514953613, "learning_rate": 2.552631578947369e-06, "loss": 0.6307, "step": 1030 }, { "epoch": 0.9865900383141762, "loss_full_dim": 0.3940610885620117, "loss_main": 0.8051474690437317, "loss_parscale": 0.8046875, "loss_sub_dim": 0.41108638048171997, "loss_vclub": 0.000823974609375, "parscale_sim": 0.98828125, "step": 1030 }, { "epoch": 0.9875478927203065, "grad_norm": 10.651994705200195, "learning_rate": 2.55e-06, "loss": 0.8051, "step": 1031 }, { "epoch": 0.9875478927203065, "loss_full_dim": 0.32489535212516785, "loss_main": 0.6670143604278564, "loss_parscale": 0.671875, "loss_sub_dim": 0.3421189785003662, "loss_vclub": 0.00051116943359375, "parscale_sim": 0.984375, "step": 1031 }, { "epoch": 0.9885057471264368, "grad_norm": 6.365133762359619, "learning_rate": 2.5473684210526317e-06, "loss": 0.667, "step": 1032 }, { "epoch": 0.9885057471264368, "loss_full_dim": 0.31626513600349426, "loss_main": 0.6483741998672485, "loss_parscale": 0.66015625, "loss_sub_dim": 0.3321090638637543, "loss_vclub": 0.000873565673828125, "parscale_sim": 0.984375, "step": 1032 }, { "epoch": 0.9894636015325671, "grad_norm": 19.413860321044922, "learning_rate": 2.5447368421052633e-06, "loss": 0.6484, "step": 1033 }, { "epoch": 0.9894636015325671, "loss_full_dim": 0.3540390133857727, "loss_main": 0.7224035263061523, "loss_parscale": 0.7265625, "loss_sub_dim": 0.368364542722702, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98828125, "step": 1033 }, { "epoch": 0.9904214559386973, "grad_norm": 9.097983360290527, "learning_rate": 2.5421052631578953e-06, "loss": 0.7224, "step": 1034 }, { "epoch": 0.9904214559386973, "loss_full_dim": 0.3117077946662903, "loss_main": 0.6384835839271545, "loss_parscale": 0.65234375, "loss_sub_dim": 0.32677578926086426, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.96484375, "step": 1034 }, { "epoch": 0.9913793103448276, "grad_norm": 11.005003929138184, "learning_rate": 2.5394736842105265e-06, "loss": 0.6385, "step": 1035 }, { "epoch": 0.9913793103448276, "loss_full_dim": 0.3159809410572052, "loss_main": 0.650222659111023, "loss_parscale": 0.6484375, "loss_sub_dim": 0.33424174785614014, "loss_vclub": 0.00060272216796875, "parscale_sim": 0.98046875, "step": 1035 }, { "epoch": 0.9923371647509579, "grad_norm": 7.874431133270264, "learning_rate": 2.536842105263158e-06, "loss": 0.6502, "step": 1036 }, { "epoch": 0.9923371647509579, "loss_full_dim": 0.331870973110199, "loss_main": 0.6794376373291016, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3475666642189026, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98828125, "step": 1036 }, { "epoch": 0.9932950191570882, "grad_norm": 6.247976779937744, "learning_rate": 2.5342105263157896e-06, "loss": 0.6794, "step": 1037 }, { "epoch": 0.9932950191570882, "loss_full_dim": 0.36095544695854187, "loss_main": 0.738528847694397, "loss_parscale": 0.75, "loss_sub_dim": 0.3775734305381775, "loss_vclub": 0.0006103515625, "parscale_sim": 0.98828125, "step": 1037 }, { "epoch": 0.9942528735632183, "grad_norm": 9.80421257019043, "learning_rate": 2.5315789473684212e-06, "loss": 0.7385, "step": 1038 }, { "epoch": 0.9942528735632183, "loss_full_dim": 0.3386712670326233, "loss_main": 0.6922721862792969, "loss_parscale": 0.69921875, "loss_sub_dim": 0.3536009192466736, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.98828125, "step": 1038 }, { "epoch": 0.9952107279693486, "grad_norm": 6.2984700202941895, "learning_rate": 2.5289473684210532e-06, "loss": 0.6923, "step": 1039 }, { "epoch": 0.9952107279693486, "loss_full_dim": 0.3551914393901825, "loss_main": 0.728070080280304, "loss_parscale": 0.7265625, "loss_sub_dim": 0.37287864089012146, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 1039 }, { "epoch": 0.9961685823754789, "grad_norm": 6.366806507110596, "learning_rate": 2.5263157894736844e-06, "loss": 0.7281, "step": 1040 }, { "epoch": 0.9961685823754789, "loss_full_dim": 0.2976182997226715, "loss_main": 0.6102093458175659, "loss_parscale": 0.609375, "loss_sub_dim": 0.312591016292572, "loss_vclub": 0.000621795654296875, "parscale_sim": 0.984375, "step": 1040 }, { "epoch": 0.9971264367816092, "grad_norm": 47.501625061035156, "learning_rate": 2.523684210526316e-06, "loss": 0.6102, "step": 1041 }, { "epoch": 0.9971264367816092, "loss_full_dim": 0.4209270179271698, "loss_main": 0.8560537099838257, "loss_parscale": 0.8515625, "loss_sub_dim": 0.4351266622543335, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.96875, "step": 1041 }, { "epoch": 0.9980842911877394, "grad_norm": 17.489656448364258, "learning_rate": 2.5210526315789475e-06, "loss": 0.8561, "step": 1042 }, { "epoch": 0.9980842911877394, "loss_full_dim": 0.3164657950401306, "loss_main": 0.653298020362854, "loss_parscale": 0.65234375, "loss_sub_dim": 0.3368322551250458, "loss_vclub": 0.000667572021484375, "parscale_sim": 0.96484375, "step": 1042 }, { "epoch": 0.9990421455938697, "grad_norm": 7.43805456161499, "learning_rate": 2.5184210526315787e-06, "loss": 0.6533, "step": 1043 }, { "epoch": 0.9990421455938697, "loss_full_dim": 0.32677680253982544, "loss_main": 0.6681444048881531, "loss_parscale": 0.6640625, "loss_sub_dim": 0.34136760234832764, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.984375, "step": 1043 }, { "epoch": 1.0, "grad_norm": 119.0500259399414, "learning_rate": 2.5157894736842107e-06, "loss": 0.6681, "step": 1044 }, { "epoch": 1.0, "loss_full_dim": 0.3530271351337433, "loss_main": 0.7213032245635986, "loss_parscale": 0.71484375, "loss_sub_dim": 0.36827605962753296, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.98046875, "step": 1044 }, { "epoch": 1.0009578544061302, "grad_norm": 7.65114164352417, "learning_rate": 2.5131578947368423e-06, "loss": 0.7213, "step": 1045 }, { "epoch": 1.0009578544061302, "loss_full_dim": 0.3293192982673645, "loss_main": 0.6711314916610718, "loss_parscale": 0.67578125, "loss_sub_dim": 0.34181222319602966, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 1045 }, { "epoch": 1.0019157088122606, "grad_norm": 8.869820594787598, "learning_rate": 2.510526315789474e-06, "loss": 0.6711, "step": 1046 }, { "epoch": 1.0019157088122606, "loss_full_dim": 0.28301671147346497, "loss_main": 0.5829761028289795, "loss_parscale": 0.58984375, "loss_sub_dim": 0.29995936155319214, "loss_vclub": 0.00061798095703125, "parscale_sim": 0.98046875, "step": 1046 }, { "epoch": 1.0028735632183907, "grad_norm": 8.472345352172852, "learning_rate": 2.5078947368421055e-06, "loss": 0.583, "step": 1047 }, { "epoch": 1.0028735632183907, "loss_full_dim": 0.35564732551574707, "loss_main": 0.7272031903266907, "loss_parscale": 0.75, "loss_sub_dim": 0.3715558648109436, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98046875, "step": 1047 }, { "epoch": 1.003831417624521, "grad_norm": 4.975111484527588, "learning_rate": 2.5052631578947375e-06, "loss": 0.7272, "step": 1048 }, { "epoch": 1.003831417624521, "loss_full_dim": 0.28641268610954285, "loss_main": 0.5849368572235107, "loss_parscale": 0.59375, "loss_sub_dim": 0.2985242009162903, "loss_vclub": 0.000640869140625, "parscale_sim": 0.984375, "step": 1048 }, { "epoch": 1.0047892720306513, "grad_norm": 9.309460639953613, "learning_rate": 2.5026315789473686e-06, "loss": 0.5849, "step": 1049 }, { "epoch": 1.0047892720306513, "loss_full_dim": 0.3882876932621002, "loss_main": 0.794133186340332, "loss_parscale": 0.796875, "loss_sub_dim": 0.4058454632759094, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.984375, "step": 1049 }, { "epoch": 1.0057471264367817, "grad_norm": 14.060222625732422, "learning_rate": 2.5e-06, "loss": 0.7941, "step": 1050 }, { "epoch": 1.0057471264367817, "loss_full_dim": 0.270906001329422, "loss_main": 0.5557749271392822, "loss_parscale": 0.56640625, "loss_sub_dim": 0.28486892580986023, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 1050 }, { "epoch": 1.0067049808429118, "grad_norm": 7.178454875946045, "learning_rate": 2.4973684210526318e-06, "loss": 0.5558, "step": 1051 }, { "epoch": 1.0067049808429118, "loss_full_dim": 0.31261467933654785, "loss_main": 0.6430388689041138, "loss_parscale": 0.64453125, "loss_sub_dim": 0.33042415976524353, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.98828125, "step": 1051 }, { "epoch": 1.0076628352490422, "grad_norm": 11.860182762145996, "learning_rate": 2.4947368421052634e-06, "loss": 0.643, "step": 1052 }, { "epoch": 1.0076628352490422, "loss_full_dim": 0.3329324424266815, "loss_main": 0.68244469165802, "loss_parscale": 0.6875, "loss_sub_dim": 0.3495122790336609, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 1052 }, { "epoch": 1.0086206896551724, "grad_norm": 7.644833087921143, "learning_rate": 2.492105263157895e-06, "loss": 0.6824, "step": 1053 }, { "epoch": 1.0086206896551724, "loss_full_dim": 0.30288469791412354, "loss_main": 0.6233150959014893, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3204304277896881, "loss_vclub": 0.000705718994140625, "parscale_sim": 0.98046875, "step": 1053 }, { "epoch": 1.0095785440613028, "grad_norm": 7.083981513977051, "learning_rate": 2.4894736842105265e-06, "loss": 0.6233, "step": 1054 }, { "epoch": 1.0095785440613028, "loss_full_dim": 0.33364373445510864, "loss_main": 0.6822822093963623, "loss_parscale": 0.671875, "loss_sub_dim": 0.34863850474357605, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.98046875, "step": 1054 }, { "epoch": 1.010536398467433, "grad_norm": 8.663122177124023, "learning_rate": 2.486842105263158e-06, "loss": 0.6823, "step": 1055 }, { "epoch": 1.010536398467433, "loss_full_dim": 0.33027076721191406, "loss_main": 0.6772358417510986, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3469650447368622, "loss_vclub": 0.00067138671875, "parscale_sim": 0.98046875, "step": 1055 }, { "epoch": 1.0114942528735633, "grad_norm": 11.3321533203125, "learning_rate": 2.4842105263157897e-06, "loss": 0.6772, "step": 1056 }, { "epoch": 1.0114942528735633, "loss_full_dim": 0.35001322627067566, "loss_main": 0.7161818742752075, "loss_parscale": 0.7265625, "loss_sub_dim": 0.3661686182022095, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.98828125, "step": 1056 }, { "epoch": 1.0124521072796935, "grad_norm": 6.374368667602539, "learning_rate": 2.4815789473684213e-06, "loss": 0.7162, "step": 1057 }, { "epoch": 1.0124521072796935, "loss_full_dim": 0.2721157968044281, "loss_main": 0.5599921941757202, "loss_parscale": 0.55859375, "loss_sub_dim": 0.2878763973712921, "loss_vclub": 0.0006103515625, "parscale_sim": 0.984375, "step": 1057 }, { "epoch": 1.0134099616858236, "grad_norm": 8.139749526977539, "learning_rate": 2.478947368421053e-06, "loss": 0.56, "step": 1058 }, { "epoch": 1.0134099616858236, "loss_full_dim": 0.3163823187351227, "loss_main": 0.646822452545166, "loss_parscale": 0.65625, "loss_sub_dim": 0.3304401636123657, "loss_vclub": 0.000701904296875, "parscale_sim": 0.984375, "step": 1058 }, { "epoch": 1.014367816091954, "grad_norm": 8.288359642028809, "learning_rate": 2.4763157894736844e-06, "loss": 0.6468, "step": 1059 }, { "epoch": 1.014367816091954, "loss_full_dim": 0.3129429221153259, "loss_main": 0.640740156173706, "loss_parscale": 0.66015625, "loss_sub_dim": 0.3277972340583801, "loss_vclub": 0.000659942626953125, "parscale_sim": 0.984375, "step": 1059 }, { "epoch": 1.0153256704980842, "grad_norm": 7.348170280456543, "learning_rate": 2.473684210526316e-06, "loss": 0.6407, "step": 1060 }, { "epoch": 1.0153256704980842, "loss_full_dim": 0.32003501057624817, "loss_main": 0.6522905826568604, "loss_parscale": 0.65625, "loss_sub_dim": 0.3322555422782898, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.98828125, "step": 1060 }, { "epoch": 1.0162835249042146, "grad_norm": 7.609851837158203, "learning_rate": 2.4710526315789476e-06, "loss": 0.6523, "step": 1061 }, { "epoch": 1.0162835249042146, "loss_full_dim": 0.3019123673439026, "loss_main": 0.6216614246368408, "loss_parscale": 0.62890625, "loss_sub_dim": 0.31974905729293823, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98046875, "step": 1061 }, { "epoch": 1.0172413793103448, "grad_norm": 10.455229759216309, "learning_rate": 2.468421052631579e-06, "loss": 0.6217, "step": 1062 }, { "epoch": 1.0172413793103448, "loss_full_dim": 0.3063417971134186, "loss_main": 0.6307284832000732, "loss_parscale": 0.625, "loss_sub_dim": 0.3243866562843323, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 1062 }, { "epoch": 1.0181992337164751, "grad_norm": 8.946558952331543, "learning_rate": 2.4657894736842108e-06, "loss": 0.6307, "step": 1063 }, { "epoch": 1.0181992337164751, "loss_full_dim": 0.30582135915756226, "loss_main": 0.627159595489502, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3213382363319397, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.98828125, "step": 1063 }, { "epoch": 1.0191570881226053, "grad_norm": 12.497559547424316, "learning_rate": 2.4631578947368424e-06, "loss": 0.6272, "step": 1064 }, { "epoch": 1.0191570881226053, "loss_full_dim": 0.3278299570083618, "loss_main": 0.6710010766983032, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3431711196899414, "loss_vclub": 0.000942230224609375, "parscale_sim": 0.984375, "step": 1064 }, { "epoch": 1.0201149425287357, "grad_norm": 6.3675856590271, "learning_rate": 2.460526315789474e-06, "loss": 0.671, "step": 1065 }, { "epoch": 1.0201149425287357, "loss_full_dim": 0.2661485970020294, "loss_main": 0.5455708503723145, "loss_parscale": 0.546875, "loss_sub_dim": 0.27942222356796265, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.984375, "step": 1065 }, { "epoch": 1.0210727969348659, "grad_norm": 7.093329906463623, "learning_rate": 2.4578947368421055e-06, "loss": 0.5456, "step": 1066 }, { "epoch": 1.0210727969348659, "loss_full_dim": 0.3487899601459503, "loss_main": 0.7160317301750183, "loss_parscale": 0.72265625, "loss_sub_dim": 0.367241770029068, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.98828125, "step": 1066 }, { "epoch": 1.0220306513409962, "grad_norm": 6.979436874389648, "learning_rate": 2.455263157894737e-06, "loss": 0.716, "step": 1067 }, { "epoch": 1.0220306513409962, "loss_full_dim": 0.2917635440826416, "loss_main": 0.5993779301643372, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30761438608169556, "loss_vclub": 0.0006103515625, "parscale_sim": 0.984375, "step": 1067 }, { "epoch": 1.0229885057471264, "grad_norm": 6.843903064727783, "learning_rate": 2.4526315789473687e-06, "loss": 0.5994, "step": 1068 }, { "epoch": 1.0229885057471264, "loss_full_dim": 0.30615267157554626, "loss_main": 0.6253519058227539, "loss_parscale": 0.61328125, "loss_sub_dim": 0.31919923424720764, "loss_vclub": 0.000858306884765625, "parscale_sim": 0.984375, "step": 1068 }, { "epoch": 1.0239463601532568, "grad_norm": 6.738847732543945, "learning_rate": 2.4500000000000003e-06, "loss": 0.6254, "step": 1069 }, { "epoch": 1.0239463601532568, "loss_full_dim": 0.37328293919563293, "loss_main": 0.7670636773109436, "loss_parscale": 0.7578125, "loss_sub_dim": 0.39378073811531067, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.95703125, "step": 1069 }, { "epoch": 1.024904214559387, "grad_norm": 83.12054443359375, "learning_rate": 2.447368421052632e-06, "loss": 0.7671, "step": 1070 }, { "epoch": 1.024904214559387, "loss_full_dim": 0.282988041639328, "loss_main": 0.582494854927063, "loss_parscale": 0.59765625, "loss_sub_dim": 0.2995067834854126, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.984375, "step": 1070 }, { "epoch": 1.0258620689655173, "grad_norm": 15.562430381774902, "learning_rate": 2.4447368421052634e-06, "loss": 0.5825, "step": 1071 }, { "epoch": 1.0258620689655173, "loss_full_dim": 0.29707106947898865, "loss_main": 0.609855592250824, "loss_parscale": 0.625, "loss_sub_dim": 0.3127845227718353, "loss_vclub": 0.000644683837890625, "parscale_sim": 0.984375, "step": 1071 }, { "epoch": 1.0268199233716475, "grad_norm": 5.4329609870910645, "learning_rate": 2.442105263157895e-06, "loss": 0.6099, "step": 1072 }, { "epoch": 1.0268199233716475, "loss_full_dim": 0.3310766816139221, "loss_main": 0.6756995916366577, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3446229100227356, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.984375, "step": 1072 }, { "epoch": 1.0277777777777777, "grad_norm": 5.4154582023620605, "learning_rate": 2.4394736842105266e-06, "loss": 0.6757, "step": 1073 }, { "epoch": 1.0277777777777777, "loss_full_dim": 0.3382551074028015, "loss_main": 0.690826416015625, "loss_parscale": 0.69921875, "loss_sub_dim": 0.3525713384151459, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.984375, "step": 1073 }, { "epoch": 1.028735632183908, "grad_norm": 8.304079055786133, "learning_rate": 2.436842105263158e-06, "loss": 0.6908, "step": 1074 }, { "epoch": 1.028735632183908, "loss_full_dim": 0.31365635991096497, "loss_main": 0.642986536026001, "loss_parscale": 0.6484375, "loss_sub_dim": 0.3293301463127136, "loss_vclub": 0.00057220458984375, "parscale_sim": 0.98046875, "step": 1074 }, { "epoch": 1.0296934865900382, "grad_norm": 6.770873069763184, "learning_rate": 2.4342105263157898e-06, "loss": 0.643, "step": 1075 }, { "epoch": 1.0296934865900382, "loss_full_dim": 0.2594923973083496, "loss_main": 0.5349768400192261, "loss_parscale": 0.546875, "loss_sub_dim": 0.2754844129085541, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 1075 }, { "epoch": 1.0306513409961686, "grad_norm": 7.837041854858398, "learning_rate": 2.4315789473684213e-06, "loss": 0.535, "step": 1076 }, { "epoch": 1.0306513409961686, "loss_full_dim": 0.27727532386779785, "loss_main": 0.5713865756988525, "loss_parscale": 0.56640625, "loss_sub_dim": 0.2941112518310547, "loss_vclub": 0.000637054443359375, "parscale_sim": 0.98046875, "step": 1076 }, { "epoch": 1.0316091954022988, "grad_norm": 13.960162162780762, "learning_rate": 2.428947368421053e-06, "loss": 0.5714, "step": 1077 }, { "epoch": 1.0316091954022988, "loss_full_dim": 0.32073676586151123, "loss_main": 0.6591898798942566, "loss_parscale": 0.67578125, "loss_sub_dim": 0.33845311403274536, "loss_vclub": 0.000911712646484375, "parscale_sim": 0.98828125, "step": 1077 }, { "epoch": 1.0325670498084292, "grad_norm": 7.915101528167725, "learning_rate": 2.4263157894736845e-06, "loss": 0.6592, "step": 1078 }, { "epoch": 1.0325670498084292, "loss_full_dim": 0.28864097595214844, "loss_main": 0.5933150053024292, "loss_parscale": 0.59375, "loss_sub_dim": 0.30467402935028076, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.984375, "step": 1078 }, { "epoch": 1.0335249042145593, "grad_norm": 5.741289138793945, "learning_rate": 2.4236842105263157e-06, "loss": 0.5933, "step": 1079 }, { "epoch": 1.0335249042145593, "loss_full_dim": 0.3223423361778259, "loss_main": 0.6623326539993286, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3399903178215027, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.984375, "step": 1079 }, { "epoch": 1.0344827586206897, "grad_norm": 9.532543182373047, "learning_rate": 2.4210526315789477e-06, "loss": 0.6623, "step": 1080 }, { "epoch": 1.0344827586206897, "loss_full_dim": 0.3373677134513855, "loss_main": 0.6918318271636963, "loss_parscale": 0.68359375, "loss_sub_dim": 0.3544641435146332, "loss_vclub": 0.000690460205078125, "parscale_sim": 0.98828125, "step": 1080 }, { "epoch": 1.03544061302682, "grad_norm": 7.012970447540283, "learning_rate": 2.4184210526315792e-06, "loss": 0.6918, "step": 1081 }, { "epoch": 1.03544061302682, "loss_full_dim": 0.2931044101715088, "loss_main": 0.5998208522796631, "loss_parscale": 0.60546875, "loss_sub_dim": 0.3067164123058319, "loss_vclub": 0.000640869140625, "parscale_sim": 0.984375, "step": 1081 }, { "epoch": 1.0363984674329503, "grad_norm": 9.505379676818848, "learning_rate": 2.415789473684211e-06, "loss": 0.5998, "step": 1082 }, { "epoch": 1.0363984674329503, "loss_full_dim": 0.30418258905410767, "loss_main": 0.6232550740242004, "loss_parscale": 0.62890625, "loss_sub_dim": 0.3190724849700928, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.98828125, "step": 1082 }, { "epoch": 1.0373563218390804, "grad_norm": 7.541578769683838, "learning_rate": 2.4131578947368424e-06, "loss": 0.6233, "step": 1083 }, { "epoch": 1.0373563218390804, "loss_full_dim": 0.2606891393661499, "loss_main": 0.5349851846694946, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2742960453033447, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.984375, "step": 1083 }, { "epoch": 1.0383141762452108, "grad_norm": 8.005407333374023, "learning_rate": 2.410526315789474e-06, "loss": 0.535, "step": 1084 }, { "epoch": 1.0383141762452108, "loss_full_dim": 0.27433472871780396, "loss_main": 0.5611346960067749, "loss_parscale": 0.56640625, "loss_sub_dim": 0.28679996728897095, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.984375, "step": 1084 }, { "epoch": 1.039272030651341, "grad_norm": 5.120755195617676, "learning_rate": 2.4078947368421056e-06, "loss": 0.5611, "step": 1085 }, { "epoch": 1.039272030651341, "loss_full_dim": 0.32063695788383484, "loss_main": 0.6544971466064453, "loss_parscale": 0.65234375, "loss_sub_dim": 0.3338601589202881, "loss_vclub": 0.000919342041015625, "parscale_sim": 0.98828125, "step": 1085 }, { "epoch": 1.0402298850574712, "grad_norm": 8.546975135803223, "learning_rate": 2.4052631578947367e-06, "loss": 0.6545, "step": 1086 }, { "epoch": 1.0402298850574712, "loss_full_dim": 0.2907300591468811, "loss_main": 0.5967634916305542, "loss_parscale": 0.59765625, "loss_sub_dim": 0.3060334324836731, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.98828125, "step": 1086 }, { "epoch": 1.0411877394636015, "grad_norm": 6.22186803817749, "learning_rate": 2.4026315789473687e-06, "loss": 0.5968, "step": 1087 }, { "epoch": 1.0411877394636015, "loss_full_dim": 0.32470428943634033, "loss_main": 0.6665542125701904, "loss_parscale": 0.671875, "loss_sub_dim": 0.3418498933315277, "loss_vclub": 0.00063323974609375, "parscale_sim": 0.984375, "step": 1087 }, { "epoch": 1.0421455938697317, "grad_norm": 10.674186706542969, "learning_rate": 2.4000000000000003e-06, "loss": 0.6666, "step": 1088 }, { "epoch": 1.0421455938697317, "loss_full_dim": 0.28362858295440674, "loss_main": 0.583790123462677, "loss_parscale": 0.5859375, "loss_sub_dim": 0.30016154050827026, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.98046875, "step": 1088 }, { "epoch": 1.043103448275862, "grad_norm": 14.707611083984375, "learning_rate": 2.397368421052632e-06, "loss": 0.5838, "step": 1089 }, { "epoch": 1.043103448275862, "loss_full_dim": 0.3575120270252228, "loss_main": 0.7320400476455688, "loss_parscale": 0.73828125, "loss_sub_dim": 0.37452802062034607, "loss_vclub": 0.000606536865234375, "parscale_sim": 0.98828125, "step": 1089 }, { "epoch": 1.0440613026819923, "grad_norm": 9.62270736694336, "learning_rate": 2.3947368421052635e-06, "loss": 0.732, "step": 1090 }, { "epoch": 1.0440613026819923, "loss_full_dim": 0.32574400305747986, "loss_main": 0.6680026054382324, "loss_parscale": 0.68359375, "loss_sub_dim": 0.34225863218307495, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.9609375, "step": 1090 }, { "epoch": 1.0450191570881227, "grad_norm": 7.991005897521973, "learning_rate": 2.392105263157895e-06, "loss": 0.668, "step": 1091 }, { "epoch": 1.0450191570881227, "loss_full_dim": 0.3078005611896515, "loss_main": 0.6322445869445801, "loss_parscale": 0.62109375, "loss_sub_dim": 0.3244440257549286, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98828125, "step": 1091 }, { "epoch": 1.0459770114942528, "grad_norm": 9.041596412658691, "learning_rate": 2.3894736842105266e-06, "loss": 0.6322, "step": 1092 }, { "epoch": 1.0459770114942528, "loss_full_dim": 0.31405210494995117, "loss_main": 0.6434261202812195, "loss_parscale": 0.6484375, "loss_sub_dim": 0.3293740153312683, "loss_vclub": 0.0006103515625, "parscale_sim": 0.984375, "step": 1092 }, { "epoch": 1.0469348659003832, "grad_norm": 7.409630298614502, "learning_rate": 2.386842105263158e-06, "loss": 0.6434, "step": 1093 }, { "epoch": 1.0469348659003832, "loss_full_dim": 0.2524268627166748, "loss_main": 0.5205960273742676, "loss_parscale": 0.53125, "loss_sub_dim": 0.26816919445991516, "loss_vclub": 0.0006256103515625, "parscale_sim": 0.984375, "step": 1093 }, { "epoch": 1.0478927203065134, "grad_norm": 4.7804951667785645, "learning_rate": 2.38421052631579e-06, "loss": 0.5206, "step": 1094 }, { "epoch": 1.0478927203065134, "loss_full_dim": 0.30824652314186096, "loss_main": 0.6314982175827026, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3232516646385193, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.98046875, "step": 1094 }, { "epoch": 1.0488505747126438, "grad_norm": 4.680675983428955, "learning_rate": 2.381578947368421e-06, "loss": 0.6315, "step": 1095 }, { "epoch": 1.0488505747126438, "loss_full_dim": 0.319039911031723, "loss_main": 0.6533815860748291, "loss_parscale": 0.6484375, "loss_sub_dim": 0.33434170484542847, "loss_vclub": 0.000591278076171875, "parscale_sim": 0.984375, "step": 1095 }, { "epoch": 1.049808429118774, "grad_norm": 5.931984901428223, "learning_rate": 2.378947368421053e-06, "loss": 0.6534, "step": 1096 }, { "epoch": 1.049808429118774, "loss_full_dim": 0.24160286784172058, "loss_main": 0.49548348784446716, "loss_parscale": 0.5, "loss_sub_dim": 0.2538806200027466, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98828125, "step": 1096 }, { "epoch": 1.0507662835249043, "grad_norm": 7.5706963539123535, "learning_rate": 2.3763157894736846e-06, "loss": 0.4955, "step": 1097 }, { "epoch": 1.0507662835249043, "loss_full_dim": 0.32297417521476746, "loss_main": 0.6612062454223633, "loss_parscale": 0.65234375, "loss_sub_dim": 0.3382320702075958, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.984375, "step": 1097 }, { "epoch": 1.0517241379310345, "grad_norm": 13.759417533874512, "learning_rate": 2.373684210526316e-06, "loss": 0.6612, "step": 1098 }, { "epoch": 1.0517241379310345, "loss_full_dim": 0.31783437728881836, "loss_main": 0.6500334143638611, "loss_parscale": 0.64453125, "loss_sub_dim": 0.3321990370750427, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98828125, "step": 1098 }, { "epoch": 1.0526819923371646, "grad_norm": 13.295684814453125, "learning_rate": 2.3710526315789477e-06, "loss": 0.65, "step": 1099 }, { "epoch": 1.0526819923371646, "loss_full_dim": 0.30159175395965576, "loss_main": 0.6161467432975769, "loss_parscale": 0.61328125, "loss_sub_dim": 0.31455498933792114, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.984375, "step": 1099 }, { "epoch": 1.053639846743295, "grad_norm": 7.551088333129883, "learning_rate": 2.368421052631579e-06, "loss": 0.6161, "step": 1100 }, { "epoch": 1.053639846743295, "loss_full_dim": 0.32558193802833557, "loss_main": 0.6649506092071533, "loss_parscale": 0.6796875, "loss_sub_dim": 0.33936870098114014, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.984375, "step": 1100 }, { "epoch": 1.0545977011494252, "grad_norm": 6.61984920501709, "learning_rate": 2.365789473684211e-06, "loss": 0.665, "step": 1101 }, { "epoch": 1.0545977011494252, "loss_full_dim": 0.2934441864490509, "loss_main": 0.601305365562439, "loss_parscale": 0.6015625, "loss_sub_dim": 0.3078611493110657, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.984375, "step": 1101 }, { "epoch": 1.0555555555555556, "grad_norm": 4.769585132598877, "learning_rate": 2.363157894736842e-06, "loss": 0.6013, "step": 1102 }, { "epoch": 1.0555555555555556, "loss_full_dim": 0.3480132818222046, "loss_main": 0.7131646275520325, "loss_parscale": 0.71875, "loss_sub_dim": 0.3651513457298279, "loss_vclub": 0.0006103515625, "parscale_sim": 0.9609375, "step": 1102 }, { "epoch": 1.0565134099616857, "grad_norm": 11.557101249694824, "learning_rate": 2.360526315789474e-06, "loss": 0.7132, "step": 1103 }, { "epoch": 1.0565134099616857, "loss_full_dim": 0.27706924080848694, "loss_main": 0.5685737133026123, "loss_parscale": 0.5703125, "loss_sub_dim": 0.291504442691803, "loss_vclub": 0.000732421875, "parscale_sim": 0.98046875, "step": 1103 }, { "epoch": 1.0574712643678161, "grad_norm": 6.667210578918457, "learning_rate": 2.357894736842105e-06, "loss": 0.5686, "step": 1104 }, { "epoch": 1.0574712643678161, "loss_full_dim": 0.3539445996284485, "loss_main": 0.7237195372581482, "loss_parscale": 0.73046875, "loss_sub_dim": 0.3697749376296997, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.98828125, "step": 1104 }, { "epoch": 1.0584291187739463, "grad_norm": 7.168417930603027, "learning_rate": 2.355263157894737e-06, "loss": 0.7237, "step": 1105 }, { "epoch": 1.0584291187739463, "loss_full_dim": 0.27320677042007446, "loss_main": 0.5586020946502686, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2853952944278717, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.98046875, "step": 1105 }, { "epoch": 1.0593869731800767, "grad_norm": 28.423564910888672, "learning_rate": 2.352631578947369e-06, "loss": 0.5586, "step": 1106 }, { "epoch": 1.0593869731800767, "loss_full_dim": 0.3254897892475128, "loss_main": 0.6648943424224854, "loss_parscale": 0.671875, "loss_sub_dim": 0.3394045829772949, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.984375, "step": 1106 }, { "epoch": 1.0603448275862069, "grad_norm": 9.128947257995605, "learning_rate": 2.35e-06, "loss": 0.6649, "step": 1107 }, { "epoch": 1.0603448275862069, "loss_full_dim": 0.3276681900024414, "loss_main": 0.6694560050964355, "loss_parscale": 0.671875, "loss_sub_dim": 0.34178781509399414, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.9765625, "step": 1107 }, { "epoch": 1.0613026819923372, "grad_norm": 7.381644248962402, "learning_rate": 2.347368421052632e-06, "loss": 0.6695, "step": 1108 }, { "epoch": 1.0613026819923372, "loss_full_dim": 0.28291139006614685, "loss_main": 0.579505205154419, "loss_parscale": 0.58203125, "loss_sub_dim": 0.2965937852859497, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.984375, "step": 1108 }, { "epoch": 1.0622605363984674, "grad_norm": 6.367630958557129, "learning_rate": 2.344736842105263e-06, "loss": 0.5795, "step": 1109 }, { "epoch": 1.0622605363984674, "loss_full_dim": 0.32807278633117676, "loss_main": 0.6697877049446106, "loss_parscale": 0.671875, "loss_sub_dim": 0.34171491861343384, "loss_vclub": 0.000885009765625, "parscale_sim": 0.98828125, "step": 1109 }, { "epoch": 1.0632183908045978, "grad_norm": 7.964906215667725, "learning_rate": 2.342105263157895e-06, "loss": 0.6698, "step": 1110 }, { "epoch": 1.0632183908045978, "loss_full_dim": 0.22244104743003845, "loss_main": 0.4562321901321411, "loss_parscale": 0.46875, "loss_sub_dim": 0.23379112780094147, "loss_vclub": 0.000736236572265625, "parscale_sim": 0.98828125, "step": 1110 }, { "epoch": 1.064176245210728, "grad_norm": 5.834765911102295, "learning_rate": 2.3394736842105263e-06, "loss": 0.4562, "step": 1111 }, { "epoch": 1.064176245210728, "loss_full_dim": 0.37721559405326843, "loss_main": 0.7682867050170898, "loss_parscale": 0.7578125, "loss_sub_dim": 0.3910711407661438, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.98828125, "step": 1111 }, { "epoch": 1.0651340996168583, "grad_norm": 7.559281826019287, "learning_rate": 2.3368421052631583e-06, "loss": 0.7683, "step": 1112 }, { "epoch": 1.0651340996168583, "loss_full_dim": 0.27058494091033936, "loss_main": 0.5540380477905273, "loss_parscale": 0.55859375, "loss_sub_dim": 0.283453106880188, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98046875, "step": 1112 }, { "epoch": 1.0660919540229885, "grad_norm": 8.938424110412598, "learning_rate": 2.3342105263157894e-06, "loss": 0.554, "step": 1113 }, { "epoch": 1.0660919540229885, "loss_full_dim": 0.24521958827972412, "loss_main": 0.5034180879592896, "loss_parscale": 0.5078125, "loss_sub_dim": 0.25819849967956543, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.98046875, "step": 1113 }, { "epoch": 1.0670498084291187, "grad_norm": 8.811627388000488, "learning_rate": 2.331578947368421e-06, "loss": 0.5034, "step": 1114 }, { "epoch": 1.0670498084291187, "loss_full_dim": 0.35400962829589844, "loss_main": 0.7241641283035278, "loss_parscale": 0.71875, "loss_sub_dim": 0.3701545000076294, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.98046875, "step": 1114 }, { "epoch": 1.068007662835249, "grad_norm": 6.426570892333984, "learning_rate": 2.328947368421053e-06, "loss": 0.7242, "step": 1115 }, { "epoch": 1.068007662835249, "loss_full_dim": 0.30073946714401245, "loss_main": 0.613339900970459, "loss_parscale": 0.62109375, "loss_sub_dim": 0.31260043382644653, "loss_vclub": 0.00091552734375, "parscale_sim": 0.984375, "step": 1115 }, { "epoch": 1.0689655172413792, "grad_norm": 6.0770697593688965, "learning_rate": 2.326315789473684e-06, "loss": 0.6133, "step": 1116 }, { "epoch": 1.0689655172413792, "loss_full_dim": 0.28507450222969055, "loss_main": 0.583562970161438, "loss_parscale": 0.58203125, "loss_sub_dim": 0.2984884977340698, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98828125, "step": 1116 }, { "epoch": 1.0699233716475096, "grad_norm": 6.373393535614014, "learning_rate": 2.323684210526316e-06, "loss": 0.5836, "step": 1117 }, { "epoch": 1.0699233716475096, "loss_full_dim": 0.2662012577056885, "loss_main": 0.5476673245429993, "loss_parscale": 0.5625, "loss_sub_dim": 0.2814660668373108, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.97265625, "step": 1117 }, { "epoch": 1.0708812260536398, "grad_norm": 7.824295997619629, "learning_rate": 2.3210526315789473e-06, "loss": 0.5477, "step": 1118 }, { "epoch": 1.0708812260536398, "loss_full_dim": 0.31127551198005676, "loss_main": 0.6369177103042603, "loss_parscale": 0.640625, "loss_sub_dim": 0.3256422281265259, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.984375, "step": 1118 }, { "epoch": 1.0718390804597702, "grad_norm": 11.999221801757812, "learning_rate": 2.3184210526315794e-06, "loss": 0.6369, "step": 1119 }, { "epoch": 1.0718390804597702, "loss_full_dim": 0.29602640867233276, "loss_main": 0.6050841212272644, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30905771255493164, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.984375, "step": 1119 }, { "epoch": 1.0727969348659003, "grad_norm": 7.0079498291015625, "learning_rate": 2.3157894736842105e-06, "loss": 0.6051, "step": 1120 }, { "epoch": 1.0727969348659003, "loss_full_dim": 0.3232106864452362, "loss_main": 0.6602349281311035, "loss_parscale": 0.671875, "loss_sub_dim": 0.3370242714881897, "loss_vclub": 0.0008544921875, "parscale_sim": 0.984375, "step": 1120 }, { "epoch": 1.0737547892720307, "grad_norm": 411.6876220703125, "learning_rate": 2.313157894736842e-06, "loss": 0.6602, "step": 1121 }, { "epoch": 1.0737547892720307, "loss_full_dim": 0.29389044642448425, "loss_main": 0.6036094427108765, "loss_parscale": 0.6015625, "loss_sub_dim": 0.3097190260887146, "loss_vclub": 0.000827789306640625, "parscale_sim": 0.98828125, "step": 1121 }, { "epoch": 1.0747126436781609, "grad_norm": 10.984487533569336, "learning_rate": 2.310526315789474e-06, "loss": 0.6036, "step": 1122 }, { "epoch": 1.0747126436781609, "loss_full_dim": 0.32071802020072937, "loss_main": 0.6571551561355591, "loss_parscale": 0.65625, "loss_sub_dim": 0.3364371657371521, "loss_vclub": 0.0006103515625, "parscale_sim": 0.984375, "step": 1122 }, { "epoch": 1.0756704980842913, "grad_norm": 7.307413101196289, "learning_rate": 2.3078947368421053e-06, "loss": 0.6572, "step": 1123 }, { "epoch": 1.0756704980842913, "loss_full_dim": 0.27802178263664246, "loss_main": 0.5684332847595215, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2904115319252014, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.9765625, "step": 1123 }, { "epoch": 1.0766283524904214, "grad_norm": 5.9122161865234375, "learning_rate": 2.3052631578947373e-06, "loss": 0.5684, "step": 1124 }, { "epoch": 1.0766283524904214, "loss_full_dim": 0.3350101709365845, "loss_main": 0.6832419037818909, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3482317328453064, "loss_vclub": 0.0007171630859375, "parscale_sim": 0.984375, "step": 1124 }, { "epoch": 1.0775862068965518, "grad_norm": 7.0988898277282715, "learning_rate": 2.3026315789473684e-06, "loss": 0.6832, "step": 1125 }, { "epoch": 1.0775862068965518, "loss_full_dim": 0.28059613704681396, "loss_main": 0.5718510150909424, "loss_parscale": 0.578125, "loss_sub_dim": 0.2912549078464508, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.984375, "step": 1125 }, { "epoch": 1.078544061302682, "grad_norm": 7.992008209228516, "learning_rate": 2.3000000000000004e-06, "loss": 0.5719, "step": 1126 }, { "epoch": 1.078544061302682, "loss_full_dim": 0.3519569933414459, "loss_main": 0.7166495323181152, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3646925091743469, "loss_vclub": 0.000965118408203125, "parscale_sim": 0.984375, "step": 1126 }, { "epoch": 1.0795019157088124, "grad_norm": 7.753222465515137, "learning_rate": 2.2973684210526316e-06, "loss": 0.7166, "step": 1127 }, { "epoch": 1.0795019157088124, "loss_full_dim": 0.28195565938949585, "loss_main": 0.5772683024406433, "loss_parscale": 0.58203125, "loss_sub_dim": 0.29531264305114746, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.984375, "step": 1127 }, { "epoch": 1.0804597701149425, "grad_norm": 7.199512004852295, "learning_rate": 2.294736842105263e-06, "loss": 0.5773, "step": 1128 }, { "epoch": 1.0804597701149425, "loss_full_dim": 0.30790114402770996, "loss_main": 0.6293877959251404, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3214866518974304, "loss_vclub": 0.000690460205078125, "parscale_sim": 0.984375, "step": 1128 }, { "epoch": 1.0814176245210727, "grad_norm": 8.173253059387207, "learning_rate": 2.2921052631578947e-06, "loss": 0.6294, "step": 1129 }, { "epoch": 1.0814176245210727, "loss_full_dim": 0.24786455929279327, "loss_main": 0.5082074999809265, "loss_parscale": 0.515625, "loss_sub_dim": 0.26034295558929443, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1129 }, { "epoch": 1.082375478927203, "grad_norm": 6.5619425773620605, "learning_rate": 2.2894736842105263e-06, "loss": 0.5082, "step": 1130 }, { "epoch": 1.082375478927203, "loss_full_dim": 0.29364150762557983, "loss_main": 0.5995548963546753, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30591338872909546, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.98828125, "step": 1130 }, { "epoch": 1.0833333333333333, "grad_norm": 6.478978633880615, "learning_rate": 2.2868421052631583e-06, "loss": 0.5996, "step": 1131 }, { "epoch": 1.0833333333333333, "loss_full_dim": 0.30657005310058594, "loss_main": 0.6257978677749634, "loss_parscale": 0.625, "loss_sub_dim": 0.31922781467437744, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.98828125, "step": 1131 }, { "epoch": 1.0842911877394636, "grad_norm": 8.24193286895752, "learning_rate": 2.2842105263157895e-06, "loss": 0.6258, "step": 1132 }, { "epoch": 1.0842911877394636, "loss_full_dim": 0.285299152135849, "loss_main": 0.5840750932693481, "loss_parscale": 0.58984375, "loss_sub_dim": 0.29877597093582153, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.984375, "step": 1132 }, { "epoch": 1.0852490421455938, "grad_norm": 3.575730085372925, "learning_rate": 2.2815789473684215e-06, "loss": 0.5841, "step": 1133 }, { "epoch": 1.0852490421455938, "loss_full_dim": 0.2872917056083679, "loss_main": 0.5849132537841797, "loss_parscale": 0.578125, "loss_sub_dim": 0.29762154817581177, "loss_vclub": 0.000652313232421875, "parscale_sim": 0.95703125, "step": 1133 }, { "epoch": 1.0862068965517242, "grad_norm": 7.603704929351807, "learning_rate": 2.2789473684210527e-06, "loss": 0.5849, "step": 1134 }, { "epoch": 1.0862068965517242, "loss_full_dim": 0.3316896855831146, "loss_main": 0.6777218580245972, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34603220224380493, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98828125, "step": 1134 }, { "epoch": 1.0871647509578544, "grad_norm": 7.2654571533203125, "learning_rate": 2.2763157894736847e-06, "loss": 0.6777, "step": 1135 }, { "epoch": 1.0871647509578544, "loss_full_dim": 0.29736483097076416, "loss_main": 0.6087695360183716, "loss_parscale": 0.609375, "loss_sub_dim": 0.3114047348499298, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 1135 }, { "epoch": 1.0881226053639848, "grad_norm": 6.424653053283691, "learning_rate": 2.273684210526316e-06, "loss": 0.6088, "step": 1136 }, { "epoch": 1.0881226053639848, "loss_full_dim": 0.3073887825012207, "loss_main": 0.6267260313034058, "loss_parscale": 0.6328125, "loss_sub_dim": 0.31933724880218506, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.98828125, "step": 1136 }, { "epoch": 1.089080459770115, "grad_norm": 8.354220390319824, "learning_rate": 2.2710526315789474e-06, "loss": 0.6267, "step": 1137 }, { "epoch": 1.089080459770115, "loss_full_dim": 0.2879335880279541, "loss_main": 0.5882987976074219, "loss_parscale": 0.58984375, "loss_sub_dim": 0.3003652095794678, "loss_vclub": 0.000759124755859375, "parscale_sim": 0.984375, "step": 1137 }, { "epoch": 1.0900383141762453, "grad_norm": 4.992157936096191, "learning_rate": 2.268421052631579e-06, "loss": 0.5883, "step": 1138 }, { "epoch": 1.0900383141762453, "loss_full_dim": 0.28759586811065674, "loss_main": 0.5883311033248901, "loss_parscale": 0.609375, "loss_sub_dim": 0.3007352352142334, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.9921875, "step": 1138 }, { "epoch": 1.0909961685823755, "grad_norm": 8.93797779083252, "learning_rate": 2.2657894736842106e-06, "loss": 0.5883, "step": 1139 }, { "epoch": 1.0909961685823755, "loss_full_dim": 0.3009207248687744, "loss_main": 0.6158133745193481, "loss_parscale": 0.61328125, "loss_sub_dim": 0.31489261984825134, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98828125, "step": 1139 }, { "epoch": 1.0919540229885056, "grad_norm": 5.410682201385498, "learning_rate": 2.2631578947368426e-06, "loss": 0.6158, "step": 1140 }, { "epoch": 1.0919540229885056, "loss_full_dim": 0.28996407985687256, "loss_main": 0.5936713814735413, "loss_parscale": 0.59375, "loss_sub_dim": 0.3037073016166687, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.98828125, "step": 1140 }, { "epoch": 1.092911877394636, "grad_norm": 6.105095863342285, "learning_rate": 2.2605263157894737e-06, "loss": 0.5937, "step": 1141 }, { "epoch": 1.092911877394636, "loss_full_dim": 0.3271671235561371, "loss_main": 0.6704398393630981, "loss_parscale": 0.671875, "loss_sub_dim": 0.34327268600463867, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98046875, "step": 1141 }, { "epoch": 1.0938697318007662, "grad_norm": 8.982144355773926, "learning_rate": 2.2578947368421057e-06, "loss": 0.6704, "step": 1142 }, { "epoch": 1.0938697318007662, "loss_full_dim": 0.27582356333732605, "loss_main": 0.5656207799911499, "loss_parscale": 0.56640625, "loss_sub_dim": 0.28979718685150146, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.984375, "step": 1142 }, { "epoch": 1.0948275862068966, "grad_norm": 8.213541984558105, "learning_rate": 2.255263157894737e-06, "loss": 0.5656, "step": 1143 }, { "epoch": 1.0948275862068966, "loss_full_dim": 0.326065331697464, "loss_main": 0.6653703451156616, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33930498361587524, "loss_vclub": 0.000743865966796875, "parscale_sim": 0.984375, "step": 1143 }, { "epoch": 1.0957854406130267, "grad_norm": 10.080772399902344, "learning_rate": 2.2526315789473685e-06, "loss": 0.6654, "step": 1144 }, { "epoch": 1.0957854406130267, "loss_full_dim": 0.2897009551525116, "loss_main": 0.5944938659667969, "loss_parscale": 0.59375, "loss_sub_dim": 0.3047929108142853, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.984375, "step": 1144 }, { "epoch": 1.0967432950191571, "grad_norm": 10.520618438720703, "learning_rate": 2.25e-06, "loss": 0.5945, "step": 1145 }, { "epoch": 1.0967432950191571, "loss_full_dim": 0.23735779523849487, "loss_main": 0.4855539798736572, "loss_parscale": 0.48046875, "loss_sub_dim": 0.24819616973400116, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.98828125, "step": 1145 }, { "epoch": 1.0977011494252873, "grad_norm": 67.17201232910156, "learning_rate": 2.2473684210526316e-06, "loss": 0.4856, "step": 1146 }, { "epoch": 1.0977011494252873, "loss_full_dim": 0.3056100904941559, "loss_main": 0.6249264478683472, "loss_parscale": 0.6328125, "loss_sub_dim": 0.31931638717651367, "loss_vclub": 0.000946044921875, "parscale_sim": 0.98828125, "step": 1146 }, { "epoch": 1.0986590038314177, "grad_norm": 9.803217887878418, "learning_rate": 2.2447368421052636e-06, "loss": 0.6249, "step": 1147 }, { "epoch": 1.0986590038314177, "loss_full_dim": 0.3043608069419861, "loss_main": 0.6219591498374939, "loss_parscale": 0.62109375, "loss_sub_dim": 0.3175983428955078, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.984375, "step": 1147 }, { "epoch": 1.0996168582375478, "grad_norm": 7.969117641448975, "learning_rate": 2.242105263157895e-06, "loss": 0.622, "step": 1148 }, { "epoch": 1.0996168582375478, "loss_full_dim": 0.25259682536125183, "loss_main": 0.5189375877380371, "loss_parscale": 0.515625, "loss_sub_dim": 0.2663407325744629, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98046875, "step": 1148 }, { "epoch": 1.1005747126436782, "grad_norm": 8.721654891967773, "learning_rate": 2.239473684210527e-06, "loss": 0.5189, "step": 1149 }, { "epoch": 1.1005747126436782, "loss_full_dim": 0.2874239683151245, "loss_main": 0.5858932733535767, "loss_parscale": 0.58984375, "loss_sub_dim": 0.29846930503845215, "loss_vclub": 0.00070953369140625, "parscale_sim": 0.984375, "step": 1149 }, { "epoch": 1.1015325670498084, "grad_norm": 7.090831756591797, "learning_rate": 2.236842105263158e-06, "loss": 0.5859, "step": 1150 }, { "epoch": 1.1015325670498084, "loss_full_dim": 0.3026603162288666, "loss_main": 0.619178056716919, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31651777029037476, "loss_vclub": 0.000621795654296875, "parscale_sim": 0.984375, "step": 1150 }, { "epoch": 1.1024904214559388, "grad_norm": 8.066030502319336, "learning_rate": 2.2342105263157895e-06, "loss": 0.6192, "step": 1151 }, { "epoch": 1.1024904214559388, "loss_full_dim": 0.2491990476846695, "loss_main": 0.5122828483581543, "loss_parscale": 0.51171875, "loss_sub_dim": 0.263083815574646, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98828125, "step": 1151 }, { "epoch": 1.103448275862069, "grad_norm": 9.3097562789917, "learning_rate": 2.231578947368421e-06, "loss": 0.5123, "step": 1152 }, { "epoch": 1.103448275862069, "loss_full_dim": 0.27292385697364807, "loss_main": 0.55901038646698, "loss_parscale": 0.5625, "loss_sub_dim": 0.2860864996910095, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98828125, "step": 1152 }, { "epoch": 1.1044061302681993, "grad_norm": 3.8785083293914795, "learning_rate": 2.2289473684210527e-06, "loss": 0.559, "step": 1153 }, { "epoch": 1.1044061302681993, "loss_full_dim": 0.28521469235420227, "loss_main": 0.5829793810844421, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29776468873023987, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.98828125, "step": 1153 }, { "epoch": 1.1053639846743295, "grad_norm": 7.674188137054443, "learning_rate": 2.2263157894736843e-06, "loss": 0.583, "step": 1154 }, { "epoch": 1.1053639846743295, "loss_full_dim": 0.247746542096138, "loss_main": 0.5083516836166382, "loss_parscale": 0.51171875, "loss_sub_dim": 0.2606051564216614, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.984375, "step": 1154 }, { "epoch": 1.1063218390804597, "grad_norm": 6.208054542541504, "learning_rate": 2.223684210526316e-06, "loss": 0.5084, "step": 1155 }, { "epoch": 1.1063218390804597, "loss_full_dim": 0.33480197191238403, "loss_main": 0.6839752197265625, "loss_parscale": 0.68359375, "loss_sub_dim": 0.34917324781417847, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.984375, "step": 1155 }, { "epoch": 1.10727969348659, "grad_norm": 45.408531188964844, "learning_rate": 2.221052631578948e-06, "loss": 0.684, "step": 1156 }, { "epoch": 1.10727969348659, "loss_full_dim": 0.31326034665107727, "loss_main": 0.641294002532959, "loss_parscale": 0.640625, "loss_sub_dim": 0.3280336558818817, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.984375, "step": 1156 }, { "epoch": 1.1082375478927202, "grad_norm": 10.996526718139648, "learning_rate": 2.218421052631579e-06, "loss": 0.6413, "step": 1157 }, { "epoch": 1.1082375478927202, "loss_full_dim": 0.2682715356349945, "loss_main": 0.55037522315979, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2821037173271179, "loss_vclub": 0.000640869140625, "parscale_sim": 0.98828125, "step": 1157 }, { "epoch": 1.1091954022988506, "grad_norm": 7.896920204162598, "learning_rate": 2.2157894736842106e-06, "loss": 0.5504, "step": 1158 }, { "epoch": 1.1091954022988506, "loss_full_dim": 0.2690553665161133, "loss_main": 0.5512228012084961, "loss_parscale": 0.55078125, "loss_sub_dim": 0.2821674346923828, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.98828125, "step": 1158 }, { "epoch": 1.1101532567049808, "grad_norm": 6.409956455230713, "learning_rate": 2.213157894736842e-06, "loss": 0.5512, "step": 1159 }, { "epoch": 1.1101532567049808, "loss_full_dim": 0.2650172710418701, "loss_main": 0.5395153760910034, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2744980752468109, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.984375, "step": 1159 }, { "epoch": 1.1111111111111112, "grad_norm": 7.925895690917969, "learning_rate": 2.2105263157894738e-06, "loss": 0.5395, "step": 1160 }, { "epoch": 1.1111111111111112, "loss_full_dim": 0.26544928550720215, "loss_main": 0.5441620945930481, "loss_parscale": 0.546875, "loss_sub_dim": 0.27871280908584595, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.984375, "step": 1160 }, { "epoch": 1.1120689655172413, "grad_norm": 5.8817338943481445, "learning_rate": 2.2078947368421054e-06, "loss": 0.5442, "step": 1161 }, { "epoch": 1.1120689655172413, "loss_full_dim": 0.263226717710495, "loss_main": 0.5405763983726501, "loss_parscale": 0.54296875, "loss_sub_dim": 0.27734968066215515, "loss_vclub": 0.00079345703125, "parscale_sim": 0.96484375, "step": 1161 }, { "epoch": 1.1130268199233717, "grad_norm": 6.16825532913208, "learning_rate": 2.205263157894737e-06, "loss": 0.5406, "step": 1162 }, { "epoch": 1.1130268199233717, "loss_full_dim": 0.2541714012622833, "loss_main": 0.5205517411231995, "loss_parscale": 0.515625, "loss_sub_dim": 0.26638033986091614, "loss_vclub": 0.000885009765625, "parscale_sim": 0.9765625, "step": 1162 }, { "epoch": 1.1139846743295019, "grad_norm": 6.128289222717285, "learning_rate": 2.2026315789473685e-06, "loss": 0.5206, "step": 1163 }, { "epoch": 1.1139846743295019, "loss_full_dim": 0.21202942728996277, "loss_main": 0.43367671966552734, "loss_parscale": 0.44140625, "loss_sub_dim": 0.22164730727672577, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.98828125, "step": 1163 }, { "epoch": 1.1149425287356323, "grad_norm": 7.436573505401611, "learning_rate": 2.2e-06, "loss": 0.4337, "step": 1164 }, { "epoch": 1.1149425287356323, "loss_full_dim": 0.31564202904701233, "loss_main": 0.6446393728256226, "loss_parscale": 0.63671875, "loss_sub_dim": 0.32899734377861023, "loss_vclub": 0.000919342041015625, "parscale_sim": 0.98828125, "step": 1164 }, { "epoch": 1.1159003831417624, "grad_norm": 6.337496280670166, "learning_rate": 2.1973684210526317e-06, "loss": 0.6446, "step": 1165 }, { "epoch": 1.1159003831417624, "loss_full_dim": 0.28866252303123474, "loss_main": 0.5919716358184814, "loss_parscale": 0.58203125, "loss_sub_dim": 0.3033091425895691, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.98828125, "step": 1165 }, { "epoch": 1.1168582375478928, "grad_norm": 6.463403224945068, "learning_rate": 2.1947368421052633e-06, "loss": 0.592, "step": 1166 }, { "epoch": 1.1168582375478928, "loss_full_dim": 0.2953093945980072, "loss_main": 0.604609489440918, "loss_parscale": 0.609375, "loss_sub_dim": 0.30930009484291077, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.984375, "step": 1166 }, { "epoch": 1.117816091954023, "grad_norm": 6.365782260894775, "learning_rate": 2.192105263157895e-06, "loss": 0.6046, "step": 1167 }, { "epoch": 1.117816091954023, "loss_full_dim": 0.28306981921195984, "loss_main": 0.5784599184989929, "loss_parscale": 0.578125, "loss_sub_dim": 0.2953900992870331, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.98046875, "step": 1167 }, { "epoch": 1.1187739463601534, "grad_norm": 6.104093551635742, "learning_rate": 2.1894736842105264e-06, "loss": 0.5785, "step": 1168 }, { "epoch": 1.1187739463601534, "loss_full_dim": 0.2547813951969147, "loss_main": 0.5252171754837036, "loss_parscale": 0.5234375, "loss_sub_dim": 0.27043581008911133, "loss_vclub": 0.000823974609375, "parscale_sim": 0.98046875, "step": 1168 }, { "epoch": 1.1197318007662835, "grad_norm": 8.602676391601562, "learning_rate": 2.186842105263158e-06, "loss": 0.5252, "step": 1169 }, { "epoch": 1.1197318007662835, "loss_full_dim": 0.29152363538742065, "loss_main": 0.5966161489486694, "loss_parscale": 0.59375, "loss_sub_dim": 0.3050924837589264, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.984375, "step": 1169 }, { "epoch": 1.1206896551724137, "grad_norm": 7.003392219543457, "learning_rate": 2.1842105263157896e-06, "loss": 0.5966, "step": 1170 }, { "epoch": 1.1206896551724137, "loss_full_dim": 0.2807767987251282, "loss_main": 0.5754196643829346, "loss_parscale": 0.57421875, "loss_sub_dim": 0.2946428656578064, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.98828125, "step": 1170 }, { "epoch": 1.121647509578544, "grad_norm": 5.590615272521973, "learning_rate": 2.181578947368421e-06, "loss": 0.5754, "step": 1171 }, { "epoch": 1.121647509578544, "loss_full_dim": 0.29724499583244324, "loss_main": 0.6086394786834717, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31139448285102844, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98046875, "step": 1171 }, { "epoch": 1.1226053639846743, "grad_norm": 7.3761420249938965, "learning_rate": 2.1789473684210528e-06, "loss": 0.6086, "step": 1172 }, { "epoch": 1.1226053639846743, "loss_full_dim": 0.3158625364303589, "loss_main": 0.6474127173423767, "loss_parscale": 0.66015625, "loss_sub_dim": 0.3315501809120178, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.984375, "step": 1172 }, { "epoch": 1.1235632183908046, "grad_norm": 8.095855712890625, "learning_rate": 2.1763157894736843e-06, "loss": 0.6474, "step": 1173 }, { "epoch": 1.1235632183908046, "loss_full_dim": 0.25871577858924866, "loss_main": 0.5295745134353638, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2708587050437927, "loss_vclub": 0.000690460205078125, "parscale_sim": 0.98046875, "step": 1173 }, { "epoch": 1.1245210727969348, "grad_norm": 34.683128356933594, "learning_rate": 2.173684210526316e-06, "loss": 0.5296, "step": 1174 }, { "epoch": 1.1245210727969348, "loss_full_dim": 0.33320143818855286, "loss_main": 0.6808953285217285, "loss_parscale": 0.68359375, "loss_sub_dim": 0.34769386053085327, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98046875, "step": 1174 }, { "epoch": 1.1254789272030652, "grad_norm": 12.459972381591797, "learning_rate": 2.1710526315789475e-06, "loss": 0.6809, "step": 1175 }, { "epoch": 1.1254789272030652, "loss_full_dim": 0.27008044719696045, "loss_main": 0.5553696155548096, "loss_parscale": 0.56640625, "loss_sub_dim": 0.2852891981601715, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.98828125, "step": 1175 }, { "epoch": 1.1264367816091954, "grad_norm": 7.567350387573242, "learning_rate": 2.168421052631579e-06, "loss": 0.5554, "step": 1176 }, { "epoch": 1.1264367816091954, "loss_full_dim": 0.27611666917800903, "loss_main": 0.5619668960571289, "loss_parscale": 0.56640625, "loss_sub_dim": 0.28585025668144226, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.98828125, "step": 1176 }, { "epoch": 1.1273946360153257, "grad_norm": 13.037087440490723, "learning_rate": 2.1657894736842107e-06, "loss": 0.562, "step": 1177 }, { "epoch": 1.1273946360153257, "loss_full_dim": 0.28627046942710876, "loss_main": 0.5862719416618347, "loss_parscale": 0.5859375, "loss_sub_dim": 0.30000147223472595, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.98828125, "step": 1177 }, { "epoch": 1.128352490421456, "grad_norm": 10.743571281433105, "learning_rate": 2.1631578947368423e-06, "loss": 0.5863, "step": 1178 }, { "epoch": 1.128352490421456, "loss_full_dim": 0.2975795567035675, "loss_main": 0.6107522249221802, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31317269802093506, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.98046875, "step": 1178 }, { "epoch": 1.1293103448275863, "grad_norm": 5.700970649719238, "learning_rate": 2.160526315789474e-06, "loss": 0.6108, "step": 1179 }, { "epoch": 1.1293103448275863, "loss_full_dim": 0.32018938660621643, "loss_main": 0.6539007425308228, "loss_parscale": 0.65625, "loss_sub_dim": 0.33371132612228394, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 1179 }, { "epoch": 1.1302681992337165, "grad_norm": 7.473668098449707, "learning_rate": 2.1578947368421054e-06, "loss": 0.6539, "step": 1180 }, { "epoch": 1.1302681992337165, "loss_full_dim": 0.3009187579154968, "loss_main": 0.6127888560295105, "loss_parscale": 0.61328125, "loss_sub_dim": 0.31187009811401367, "loss_vclub": 0.0011138916015625, "parscale_sim": 0.98828125, "step": 1180 }, { "epoch": 1.1312260536398466, "grad_norm": 9.231432914733887, "learning_rate": 2.155263157894737e-06, "loss": 0.6128, "step": 1181 }, { "epoch": 1.1312260536398466, "loss_full_dim": 0.28455954790115356, "loss_main": 0.5823042392730713, "loss_parscale": 0.58203125, "loss_sub_dim": 0.2977447211742401, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98828125, "step": 1181 }, { "epoch": 1.132183908045977, "grad_norm": 7.954113006591797, "learning_rate": 2.1526315789473686e-06, "loss": 0.5823, "step": 1182 }, { "epoch": 1.132183908045977, "loss_full_dim": 0.27945029735565186, "loss_main": 0.5714790225028992, "loss_parscale": 0.578125, "loss_sub_dim": 0.2920287251472473, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.9765625, "step": 1182 }, { "epoch": 1.1331417624521074, "grad_norm": 10.399324417114258, "learning_rate": 2.15e-06, "loss": 0.5715, "step": 1183 }, { "epoch": 1.1331417624521074, "loss_full_dim": 0.30629199743270874, "loss_main": 0.6279555559158325, "loss_parscale": 0.62890625, "loss_sub_dim": 0.3216635584831238, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.984375, "step": 1183 }, { "epoch": 1.1340996168582376, "grad_norm": 7.752561092376709, "learning_rate": 2.1473684210526317e-06, "loss": 0.628, "step": 1184 }, { "epoch": 1.1340996168582376, "loss_full_dim": 0.2612285912036896, "loss_main": 0.5336484909057617, "loss_parscale": 0.53515625, "loss_sub_dim": 0.27241989970207214, "loss_vclub": 0.00079345703125, "parscale_sim": 0.98828125, "step": 1184 }, { "epoch": 1.1350574712643677, "grad_norm": 6.502110004425049, "learning_rate": 2.1447368421052633e-06, "loss": 0.5336, "step": 1185 }, { "epoch": 1.1350574712643677, "loss_full_dim": 0.2949298322200775, "loss_main": 0.603441596031189, "loss_parscale": 0.609375, "loss_sub_dim": 0.30851173400878906, "loss_vclub": 0.000873565673828125, "parscale_sim": 0.984375, "step": 1185 }, { "epoch": 1.1360153256704981, "grad_norm": 7.279881477355957, "learning_rate": 2.142105263157895e-06, "loss": 0.6034, "step": 1186 }, { "epoch": 1.1360153256704981, "loss_full_dim": 0.37167584896087646, "loss_main": 0.7583233118057251, "loss_parscale": 0.7578125, "loss_sub_dim": 0.386647492647171, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.98046875, "step": 1186 }, { "epoch": 1.1369731800766283, "grad_norm": 8.985945701599121, "learning_rate": 2.1394736842105265e-06, "loss": 0.7583, "step": 1187 }, { "epoch": 1.1369731800766283, "loss_full_dim": 0.2942744791507721, "loss_main": 0.6020634174346924, "loss_parscale": 0.59375, "loss_sub_dim": 0.3077889680862427, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.984375, "step": 1187 }, { "epoch": 1.1379310344827587, "grad_norm": 7.924509525299072, "learning_rate": 2.136842105263158e-06, "loss": 0.6021, "step": 1188 }, { "epoch": 1.1379310344827587, "loss_full_dim": 0.2580330967903137, "loss_main": 0.5289143323898315, "loss_parscale": 0.53515625, "loss_sub_dim": 0.27088120579719543, "loss_vclub": 0.000972747802734375, "parscale_sim": 0.984375, "step": 1188 }, { "epoch": 1.1388888888888888, "grad_norm": 7.471564769744873, "learning_rate": 2.1342105263157897e-06, "loss": 0.5289, "step": 1189 }, { "epoch": 1.1388888888888888, "loss_full_dim": 0.3019498288631439, "loss_main": 0.6182044744491577, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3162546753883362, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.98046875, "step": 1189 }, { "epoch": 1.1398467432950192, "grad_norm": 7.760400295257568, "learning_rate": 2.1315789473684212e-06, "loss": 0.6182, "step": 1190 }, { "epoch": 1.1398467432950192, "loss_full_dim": 0.3191104531288147, "loss_main": 0.6512576937675476, "loss_parscale": 0.65625, "loss_sub_dim": 0.3321472406387329, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.98828125, "step": 1190 }, { "epoch": 1.1408045977011494, "grad_norm": 8.085426330566406, "learning_rate": 2.128947368421053e-06, "loss": 0.6513, "step": 1191 }, { "epoch": 1.1408045977011494, "loss_full_dim": 0.29127198457717896, "loss_main": 0.5958532094955444, "loss_parscale": 0.59375, "loss_sub_dim": 0.3045811951160431, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.98828125, "step": 1191 }, { "epoch": 1.1417624521072798, "grad_norm": 6.64500093460083, "learning_rate": 2.1263157894736844e-06, "loss": 0.5959, "step": 1192 }, { "epoch": 1.1417624521072798, "loss_full_dim": 0.2829969525337219, "loss_main": 0.5790597200393677, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29606279730796814, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.9921875, "step": 1192 }, { "epoch": 1.14272030651341, "grad_norm": 8.049617767333984, "learning_rate": 2.123684210526316e-06, "loss": 0.5791, "step": 1193 }, { "epoch": 1.14272030651341, "loss_full_dim": 0.2403327077627182, "loss_main": 0.49483412504196167, "loss_parscale": 0.5, "loss_sub_dim": 0.2545014023780823, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.984375, "step": 1193 }, { "epoch": 1.1436781609195403, "grad_norm": 10.66437816619873, "learning_rate": 2.1210526315789476e-06, "loss": 0.4948, "step": 1194 }, { "epoch": 1.1436781609195403, "loss_full_dim": 0.2948138117790222, "loss_main": 0.6021547913551331, "loss_parscale": 0.609375, "loss_sub_dim": 0.30734097957611084, "loss_vclub": 0.0006561279296875, "parscale_sim": 0.984375, "step": 1194 }, { "epoch": 1.1446360153256705, "grad_norm": 8.270486831665039, "learning_rate": 2.118421052631579e-06, "loss": 0.6022, "step": 1195 }, { "epoch": 1.1446360153256705, "loss_full_dim": 0.2733437120914459, "loss_main": 0.5593453645706177, "loss_parscale": 0.5625, "loss_sub_dim": 0.28600168228149414, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.984375, "step": 1195 }, { "epoch": 1.1455938697318007, "grad_norm": 9.4451904296875, "learning_rate": 2.1157894736842107e-06, "loss": 0.5593, "step": 1196 }, { "epoch": 1.1455938697318007, "loss_full_dim": 0.260856568813324, "loss_main": 0.5346924662590027, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2738358974456787, "loss_vclub": 0.0008544921875, "parscale_sim": 0.984375, "step": 1196 }, { "epoch": 1.146551724137931, "grad_norm": 8.65373420715332, "learning_rate": 2.1131578947368423e-06, "loss": 0.5347, "step": 1197 }, { "epoch": 1.146551724137931, "loss_full_dim": 0.24978165328502655, "loss_main": 0.5113109946250916, "loss_parscale": 0.515625, "loss_sub_dim": 0.2615293562412262, "loss_vclub": 0.000934600830078125, "parscale_sim": 0.98046875, "step": 1197 }, { "epoch": 1.1475095785440612, "grad_norm": 10.767964363098145, "learning_rate": 2.110526315789474e-06, "loss": 0.5113, "step": 1198 }, { "epoch": 1.1475095785440612, "loss_full_dim": 0.3001728951931, "loss_main": 0.6172642707824707, "loss_parscale": 0.625, "loss_sub_dim": 0.3170913755893707, "loss_vclub": 0.000946044921875, "parscale_sim": 0.98828125, "step": 1198 }, { "epoch": 1.1484674329501916, "grad_norm": 7.362032890319824, "learning_rate": 2.1078947368421055e-06, "loss": 0.6173, "step": 1199 }, { "epoch": 1.1484674329501916, "loss_full_dim": 0.28838977217674255, "loss_main": 0.5903496146202087, "loss_parscale": 0.60546875, "loss_sub_dim": 0.3019598424434662, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 1199 }, { "epoch": 1.1494252873563218, "grad_norm": 10.557988166809082, "learning_rate": 2.105263157894737e-06, "loss": 0.5903, "step": 1200 }, { "epoch": 1.1494252873563218, "loss_full_dim": 0.27709564566612244, "loss_main": 0.5682976841926575, "loss_parscale": 0.5703125, "loss_sub_dim": 0.29120203852653503, "loss_vclub": 0.000885009765625, "parscale_sim": 0.984375, "step": 1200 }, { "epoch": 1.1503831417624522, "grad_norm": 7.163814544677734, "learning_rate": 2.1026315789473686e-06, "loss": 0.5683, "step": 1201 }, { "epoch": 1.1503831417624522, "loss_full_dim": 0.3074781894683838, "loss_main": 0.6290776133537292, "loss_parscale": 0.62890625, "loss_sub_dim": 0.32159942388534546, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.984375, "step": 1201 }, { "epoch": 1.1513409961685823, "grad_norm": 9.909102439880371, "learning_rate": 2.1000000000000002e-06, "loss": 0.6291, "step": 1202 }, { "epoch": 1.1513409961685823, "loss_full_dim": 0.29937902092933655, "loss_main": 0.6127246618270874, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31334567070007324, "loss_vclub": 0.000728607177734375, "parscale_sim": 0.98828125, "step": 1202 }, { "epoch": 1.1522988505747127, "grad_norm": 8.879443168640137, "learning_rate": 2.097368421052632e-06, "loss": 0.6127, "step": 1203 }, { "epoch": 1.1522988505747127, "loss_full_dim": 0.2701530456542969, "loss_main": 0.5538998246192932, "loss_parscale": 0.55078125, "loss_sub_dim": 0.28374677896499634, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.984375, "step": 1203 }, { "epoch": 1.1532567049808429, "grad_norm": 6.495558738708496, "learning_rate": 2.0947368421052634e-06, "loss": 0.5539, "step": 1204 }, { "epoch": 1.1532567049808429, "loss_full_dim": 0.30124449729919434, "loss_main": 0.6169938445091248, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3157493472099304, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.984375, "step": 1204 }, { "epoch": 1.1542145593869733, "grad_norm": 8.367871284484863, "learning_rate": 2.092105263157895e-06, "loss": 0.617, "step": 1205 }, { "epoch": 1.1542145593869733, "loss_full_dim": 0.29938220977783203, "loss_main": 0.6120245456695557, "loss_parscale": 0.609375, "loss_sub_dim": 0.31264233589172363, "loss_vclub": 0.00064849853515625, "parscale_sim": 0.984375, "step": 1205 }, { "epoch": 1.1551724137931034, "grad_norm": 8.742072105407715, "learning_rate": 2.0894736842105266e-06, "loss": 0.612, "step": 1206 }, { "epoch": 1.1551724137931034, "loss_full_dim": 0.30769452452659607, "loss_main": 0.6285907030105591, "loss_parscale": 0.63671875, "loss_sub_dim": 0.3208962082862854, "loss_vclub": 0.000896453857421875, "parscale_sim": 0.984375, "step": 1206 }, { "epoch": 1.1561302681992338, "grad_norm": 9.195372581481934, "learning_rate": 2.086842105263158e-06, "loss": 0.6286, "step": 1207 }, { "epoch": 1.1561302681992338, "loss_full_dim": 0.2499464899301529, "loss_main": 0.5103291869163513, "loss_parscale": 0.515625, "loss_sub_dim": 0.2603827118873596, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98828125, "step": 1207 }, { "epoch": 1.157088122605364, "grad_norm": 8.28538703918457, "learning_rate": 2.0842105263157897e-06, "loss": 0.5103, "step": 1208 }, { "epoch": 1.157088122605364, "loss_full_dim": 0.2659127712249756, "loss_main": 0.5430788993835449, "loss_parscale": 0.5546875, "loss_sub_dim": 0.27716612815856934, "loss_vclub": 0.000972747802734375, "parscale_sim": 0.984375, "step": 1208 }, { "epoch": 1.1580459770114944, "grad_norm": 5.9854536056518555, "learning_rate": 2.0815789473684213e-06, "loss": 0.5431, "step": 1209 }, { "epoch": 1.1580459770114944, "loss_full_dim": 0.31566745042800903, "loss_main": 0.6471540331840515, "loss_parscale": 0.6484375, "loss_sub_dim": 0.3314865827560425, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.984375, "step": 1209 }, { "epoch": 1.1590038314176245, "grad_norm": 8.17809009552002, "learning_rate": 2.078947368421053e-06, "loss": 0.6472, "step": 1210 }, { "epoch": 1.1590038314176245, "loss_full_dim": 0.31404027342796326, "loss_main": 0.6424494981765747, "loss_parscale": 0.640625, "loss_sub_dim": 0.32840922474861145, "loss_vclub": 0.0005950927734375, "parscale_sim": 0.9765625, "step": 1210 }, { "epoch": 1.1599616858237547, "grad_norm": 5.4037652015686035, "learning_rate": 2.0763157894736845e-06, "loss": 0.6424, "step": 1211 }, { "epoch": 1.1599616858237547, "loss_full_dim": 0.2784048914909363, "loss_main": 0.568786084651947, "loss_parscale": 0.578125, "loss_sub_dim": 0.29038119316101074, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.98046875, "step": 1211 }, { "epoch": 1.160919540229885, "grad_norm": 7.510874271392822, "learning_rate": 2.073684210526316e-06, "loss": 0.5688, "step": 1212 }, { "epoch": 1.160919540229885, "loss_full_dim": 0.321826308965683, "loss_main": 0.6580244302749634, "loss_parscale": 0.65625, "loss_sub_dim": 0.336198091506958, "loss_vclub": 0.000888824462890625, "parscale_sim": 0.96484375, "step": 1212 }, { "epoch": 1.1618773946360152, "grad_norm": 9.766109466552734, "learning_rate": 2.0710526315789476e-06, "loss": 0.658, "step": 1213 }, { "epoch": 1.1618773946360152, "loss_full_dim": 0.26942554116249084, "loss_main": 0.5510565042495728, "loss_parscale": 0.5625, "loss_sub_dim": 0.2816309332847595, "loss_vclub": 0.00091552734375, "parscale_sim": 0.98828125, "step": 1213 }, { "epoch": 1.1628352490421456, "grad_norm": 5.747315406799316, "learning_rate": 2.068421052631579e-06, "loss": 0.5511, "step": 1214 }, { "epoch": 1.1628352490421456, "loss_full_dim": 0.3324628472328186, "loss_main": 0.6773161888122559, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34485334157943726, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.984375, "step": 1214 }, { "epoch": 1.1637931034482758, "grad_norm": 5.860902309417725, "learning_rate": 2.0657894736842108e-06, "loss": 0.6773, "step": 1215 }, { "epoch": 1.1637931034482758, "loss_full_dim": 0.28998875617980957, "loss_main": 0.592993438243866, "loss_parscale": 0.5859375, "loss_sub_dim": 0.3030046820640564, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.98046875, "step": 1215 }, { "epoch": 1.1647509578544062, "grad_norm": 14.083077430725098, "learning_rate": 2.0631578947368424e-06, "loss": 0.593, "step": 1216 }, { "epoch": 1.1647509578544062, "loss_full_dim": 0.2780733108520508, "loss_main": 0.5684295892715454, "loss_parscale": 0.56640625, "loss_sub_dim": 0.29035627841949463, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.984375, "step": 1216 }, { "epoch": 1.1657088122605364, "grad_norm": 6.690465450286865, "learning_rate": 2.060526315789474e-06, "loss": 0.5684, "step": 1217 }, { "epoch": 1.1657088122605364, "loss_full_dim": 0.25745320320129395, "loss_main": 0.5310872197151184, "loss_parscale": 0.53125, "loss_sub_dim": 0.27363401651382446, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.984375, "step": 1217 }, { "epoch": 1.1666666666666667, "grad_norm": 5.4349045753479, "learning_rate": 2.0578947368421055e-06, "loss": 0.5311, "step": 1218 }, { "epoch": 1.1666666666666667, "loss_full_dim": 0.27605533599853516, "loss_main": 0.562751293182373, "loss_parscale": 0.5625, "loss_sub_dim": 0.2866959571838379, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.98828125, "step": 1218 }, { "epoch": 1.167624521072797, "grad_norm": 5.75303316116333, "learning_rate": 2.055263157894737e-06, "loss": 0.5628, "step": 1219 }, { "epoch": 1.167624521072797, "loss_full_dim": 0.27525967359542847, "loss_main": 0.5646566152572632, "loss_parscale": 0.5625, "loss_sub_dim": 0.28939691185951233, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 1219 }, { "epoch": 1.1685823754789273, "grad_norm": 6.025733947753906, "learning_rate": 2.0526315789473687e-06, "loss": 0.5647, "step": 1220 }, { "epoch": 1.1685823754789273, "loss_full_dim": 0.2732774019241333, "loss_main": 0.559736967086792, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2864595651626587, "loss_vclub": 0.000957489013671875, "parscale_sim": 0.98828125, "step": 1220 }, { "epoch": 1.1695402298850575, "grad_norm": 8.358555793762207, "learning_rate": 2.05e-06, "loss": 0.5597, "step": 1221 }, { "epoch": 1.1695402298850575, "loss_full_dim": 0.3058362603187561, "loss_main": 0.6276639103889465, "loss_parscale": 0.63671875, "loss_sub_dim": 0.32182765007019043, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.984375, "step": 1221 }, { "epoch": 1.1704980842911876, "grad_norm": 5.3386921882629395, "learning_rate": 2.047368421052632e-06, "loss": 0.6277, "step": 1222 }, { "epoch": 1.1704980842911876, "loss_full_dim": 0.3339465260505676, "loss_main": 0.6812994480133057, "loss_parscale": 0.6953125, "loss_sub_dim": 0.34735292196273804, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1222 }, { "epoch": 1.171455938697318, "grad_norm": 9.727170944213867, "learning_rate": 2.0447368421052634e-06, "loss": 0.6813, "step": 1223 }, { "epoch": 1.171455938697318, "loss_full_dim": 0.3301299810409546, "loss_main": 0.6717184782028198, "loss_parscale": 0.671875, "loss_sub_dim": 0.3415885269641876, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.98828125, "step": 1223 }, { "epoch": 1.1724137931034484, "grad_norm": 7.830484867095947, "learning_rate": 2.042105263157895e-06, "loss": 0.6717, "step": 1224 }, { "epoch": 1.1724137931034484, "loss_full_dim": 0.2916133999824524, "loss_main": 0.5959782600402832, "loss_parscale": 0.609375, "loss_sub_dim": 0.3043648600578308, "loss_vclub": 0.000885009765625, "parscale_sim": 0.98046875, "step": 1224 }, { "epoch": 1.1733716475095786, "grad_norm": 7.925443172454834, "learning_rate": 2.0394736842105266e-06, "loss": 0.596, "step": 1225 }, { "epoch": 1.1733716475095786, "loss_full_dim": 0.26477259397506714, "loss_main": 0.5424202680587769, "loss_parscale": 0.546875, "loss_sub_dim": 0.2776477038860321, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.98828125, "step": 1225 }, { "epoch": 1.1743295019157087, "grad_norm": 7.382889747619629, "learning_rate": 2.036842105263158e-06, "loss": 0.5424, "step": 1226 }, { "epoch": 1.1743295019157087, "loss_full_dim": 0.24538812041282654, "loss_main": 0.5024079084396362, "loss_parscale": 0.5, "loss_sub_dim": 0.2570197582244873, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98046875, "step": 1226 }, { "epoch": 1.1752873563218391, "grad_norm": 4.971694469451904, "learning_rate": 2.0342105263157898e-06, "loss": 0.5024, "step": 1227 }, { "epoch": 1.1752873563218391, "loss_full_dim": 0.3422704041004181, "loss_main": 0.696713924407959, "loss_parscale": 0.6953125, "loss_sub_dim": 0.3544434905052185, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.984375, "step": 1227 }, { "epoch": 1.1762452107279693, "grad_norm": 10.056656837463379, "learning_rate": 2.031578947368421e-06, "loss": 0.6967, "step": 1228 }, { "epoch": 1.1762452107279693, "loss_full_dim": 0.2812417447566986, "loss_main": 0.5759122371673584, "loss_parscale": 0.58203125, "loss_sub_dim": 0.2946705222129822, "loss_vclub": 0.000850677490234375, "parscale_sim": 0.98828125, "step": 1228 }, { "epoch": 1.1772030651340997, "grad_norm": 9.189476013183594, "learning_rate": 2.028947368421053e-06, "loss": 0.5759, "step": 1229 }, { "epoch": 1.1772030651340997, "loss_full_dim": 0.31721824407577515, "loss_main": 0.6495383977890015, "loss_parscale": 0.65625, "loss_sub_dim": 0.3323201537132263, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.984375, "step": 1229 }, { "epoch": 1.1781609195402298, "grad_norm": 6.5008368492126465, "learning_rate": 2.026315789473684e-06, "loss": 0.6495, "step": 1230 }, { "epoch": 1.1781609195402298, "loss_full_dim": 0.2667295038700104, "loss_main": 0.5462836027145386, "loss_parscale": 0.54296875, "loss_sub_dim": 0.2795541286468506, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98828125, "step": 1230 }, { "epoch": 1.1791187739463602, "grad_norm": 12.113905906677246, "learning_rate": 2.023684210526316e-06, "loss": 0.5463, "step": 1231 }, { "epoch": 1.1791187739463602, "loss_full_dim": 0.2689402997493744, "loss_main": 0.550423264503479, "loss_parscale": 0.5546875, "loss_sub_dim": 0.281482994556427, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.984375, "step": 1231 }, { "epoch": 1.1800766283524904, "grad_norm": 4.822048187255859, "learning_rate": 2.0210526315789477e-06, "loss": 0.5504, "step": 1232 }, { "epoch": 1.1800766283524904, "loss_full_dim": 0.2585170269012451, "loss_main": 0.5276925563812256, "loss_parscale": 0.53515625, "loss_sub_dim": 0.26917555928230286, "loss_vclub": 0.000965118408203125, "parscale_sim": 0.984375, "step": 1232 }, { "epoch": 1.1810344827586208, "grad_norm": 7.627866744995117, "learning_rate": 2.0184210526315793e-06, "loss": 0.5277, "step": 1233 }, { "epoch": 1.1810344827586208, "loss_full_dim": 0.28618690371513367, "loss_main": 0.5858911275863647, "loss_parscale": 0.59375, "loss_sub_dim": 0.29970425367355347, "loss_vclub": 0.0010528564453125, "parscale_sim": 0.984375, "step": 1233 }, { "epoch": 1.181992337164751, "grad_norm": 8.162261009216309, "learning_rate": 2.015789473684211e-06, "loss": 0.5859, "step": 1234 }, { "epoch": 1.181992337164751, "loss_full_dim": 0.2907581925392151, "loss_main": 0.5928761959075928, "loss_parscale": 0.5859375, "loss_sub_dim": 0.3021180331707001, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.98828125, "step": 1234 }, { "epoch": 1.1829501915708813, "grad_norm": 7.874083995819092, "learning_rate": 2.013157894736842e-06, "loss": 0.5929, "step": 1235 }, { "epoch": 1.1829501915708813, "loss_full_dim": 0.28589117527008057, "loss_main": 0.5879839658737183, "loss_parscale": 0.5859375, "loss_sub_dim": 0.3020927906036377, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.98828125, "step": 1235 }, { "epoch": 1.1839080459770115, "grad_norm": 16.32649040222168, "learning_rate": 2.010526315789474e-06, "loss": 0.588, "step": 1236 }, { "epoch": 1.1839080459770115, "loss_full_dim": 0.2822301685810089, "loss_main": 0.577703595161438, "loss_parscale": 0.58203125, "loss_sub_dim": 0.2954733967781067, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.98046875, "step": 1236 }, { "epoch": 1.1848659003831417, "grad_norm": 6.969128131866455, "learning_rate": 2.007894736842105e-06, "loss": 0.5777, "step": 1237 }, { "epoch": 1.1848659003831417, "loss_full_dim": 0.2336949110031128, "loss_main": 0.47980833053588867, "loss_parscale": 0.484375, "loss_sub_dim": 0.24611343443393707, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.98828125, "step": 1237 }, { "epoch": 1.185823754789272, "grad_norm": 6.139298915863037, "learning_rate": 2.005263157894737e-06, "loss": 0.4798, "step": 1238 }, { "epoch": 1.185823754789272, "loss_full_dim": 0.2519037127494812, "loss_main": 0.5169504284858704, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26504671573638916, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.984375, "step": 1238 }, { "epoch": 1.1867816091954022, "grad_norm": 9.789909362792969, "learning_rate": 2.0026315789473683e-06, "loss": 0.517, "step": 1239 }, { "epoch": 1.1867816091954022, "loss_full_dim": 0.30647850036621094, "loss_main": 0.6289407014846802, "loss_parscale": 0.63671875, "loss_sub_dim": 0.32246217131614685, "loss_vclub": 0.000888824462890625, "parscale_sim": 0.984375, "step": 1239 }, { "epoch": 1.1877394636015326, "grad_norm": 5.837466716766357, "learning_rate": 2.0000000000000003e-06, "loss": 0.6289, "step": 1240 }, { "epoch": 1.1877394636015326, "loss_full_dim": 0.29317334294319153, "loss_main": 0.5979599952697754, "loss_parscale": 0.59375, "loss_sub_dim": 0.3047866225242615, "loss_vclub": 0.000965118408203125, "parscale_sim": 0.984375, "step": 1240 }, { "epoch": 1.1886973180076628, "grad_norm": 5.449151992797852, "learning_rate": 1.997368421052632e-06, "loss": 0.598, "step": 1241 }, { "epoch": 1.1886973180076628, "loss_full_dim": 0.25306254625320435, "loss_main": 0.5191028118133545, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26604029536247253, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.984375, "step": 1241 }, { "epoch": 1.1896551724137931, "grad_norm": 9.648698806762695, "learning_rate": 1.994736842105263e-06, "loss": 0.5191, "step": 1242 }, { "epoch": 1.1896551724137931, "loss_full_dim": 0.28798773884773254, "loss_main": 0.5890753865242004, "loss_parscale": 0.59765625, "loss_sub_dim": 0.3010876476764679, "loss_vclub": 0.000732421875, "parscale_sim": 0.98046875, "step": 1242 }, { "epoch": 1.1906130268199233, "grad_norm": 8.353065490722656, "learning_rate": 1.992105263157895e-06, "loss": 0.5891, "step": 1243 }, { "epoch": 1.1906130268199233, "loss_full_dim": 0.2501082420349121, "loss_main": 0.5127418041229248, "loss_parscale": 0.51171875, "loss_sub_dim": 0.2626335620880127, "loss_vclub": 0.00103759765625, "parscale_sim": 0.9765625, "step": 1243 }, { "epoch": 1.1915708812260537, "grad_norm": 9.1087646484375, "learning_rate": 1.9894736842105262e-06, "loss": 0.5127, "step": 1244 }, { "epoch": 1.1915708812260537, "loss_full_dim": 0.26522159576416016, "loss_main": 0.5440217852592468, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27880018949508667, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.984375, "step": 1244 }, { "epoch": 1.1925287356321839, "grad_norm": 4.88273811340332, "learning_rate": 1.9868421052631582e-06, "loss": 0.544, "step": 1245 }, { "epoch": 1.1925287356321839, "loss_full_dim": 0.27384230494499207, "loss_main": 0.5613325834274292, "loss_parscale": 0.5625, "loss_sub_dim": 0.28749027848243713, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.98828125, "step": 1245 }, { "epoch": 1.1934865900383143, "grad_norm": 11.263348579406738, "learning_rate": 1.9842105263157894e-06, "loss": 0.5613, "step": 1246 }, { "epoch": 1.1934865900383143, "loss_full_dim": 0.28566813468933105, "loss_main": 0.5844497680664062, "loss_parscale": 0.59375, "loss_sub_dim": 0.2987816035747528, "loss_vclub": 0.000823974609375, "parscale_sim": 0.98828125, "step": 1246 }, { "epoch": 1.1944444444444444, "grad_norm": 7.250735759735107, "learning_rate": 1.9815789473684214e-06, "loss": 0.5844, "step": 1247 }, { "epoch": 1.1944444444444444, "loss_full_dim": 0.3045486509799957, "loss_main": 0.6210227012634277, "loss_parscale": 0.625, "loss_sub_dim": 0.3164740204811096, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.98046875, "step": 1247 }, { "epoch": 1.1954022988505748, "grad_norm": 7.374420166015625, "learning_rate": 1.978947368421053e-06, "loss": 0.621, "step": 1248 }, { "epoch": 1.1954022988505748, "loss_full_dim": 0.29562363028526306, "loss_main": 0.6046196818351746, "loss_parscale": 0.60546875, "loss_sub_dim": 0.3089960515499115, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.984375, "step": 1248 }, { "epoch": 1.196360153256705, "grad_norm": 8.936529159545898, "learning_rate": 1.976315789473684e-06, "loss": 0.6046, "step": 1249 }, { "epoch": 1.196360153256705, "loss_full_dim": 0.312436044216156, "loss_main": 0.6372085809707642, "loss_parscale": 0.63671875, "loss_sub_dim": 0.32477253675460815, "loss_vclub": 0.00091552734375, "parscale_sim": 0.984375, "step": 1249 }, { "epoch": 1.1973180076628354, "grad_norm": 10.899024963378906, "learning_rate": 1.973684210526316e-06, "loss": 0.6372, "step": 1250 }, { "epoch": 1.1973180076628354, "loss_full_dim": 0.268485426902771, "loss_main": 0.550788164138794, "loss_parscale": 0.5546875, "loss_sub_dim": 0.28230273723602295, "loss_vclub": 0.000949859619140625, "parscale_sim": 0.98046875, "step": 1250 }, { "epoch": 1.1982758620689655, "grad_norm": 5.59716272354126, "learning_rate": 1.9710526315789473e-06, "loss": 0.5508, "step": 1251 }, { "epoch": 1.1982758620689655, "loss_full_dim": 0.24362565577030182, "loss_main": 0.4986386299133301, "loss_parscale": 0.50390625, "loss_sub_dim": 0.25501295924186707, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.984375, "step": 1251 }, { "epoch": 1.1992337164750957, "grad_norm": 6.718475818634033, "learning_rate": 1.9684210526315793e-06, "loss": 0.4986, "step": 1252 }, { "epoch": 1.1992337164750957, "loss_full_dim": 0.2436511367559433, "loss_main": 0.5005275011062622, "loss_parscale": 0.50390625, "loss_sub_dim": 0.2568763494491577, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.984375, "step": 1252 }, { "epoch": 1.200191570881226, "grad_norm": 28.52167320251465, "learning_rate": 1.9657894736842105e-06, "loss": 0.5005, "step": 1253 }, { "epoch": 1.200191570881226, "loss_full_dim": 0.2893209159374237, "loss_main": 0.592894434928894, "loss_parscale": 0.59375, "loss_sub_dim": 0.30357348918914795, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.984375, "step": 1253 }, { "epoch": 1.2011494252873562, "grad_norm": 5.637784481048584, "learning_rate": 1.9631578947368425e-06, "loss": 0.5929, "step": 1254 }, { "epoch": 1.2011494252873562, "loss_full_dim": 0.2802206575870514, "loss_main": 0.5718541145324707, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2916334271430969, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.98046875, "step": 1254 }, { "epoch": 1.2021072796934866, "grad_norm": 7.167033672332764, "learning_rate": 1.9605263157894736e-06, "loss": 0.5719, "step": 1255 }, { "epoch": 1.2021072796934866, "loss_full_dim": 0.2576953172683716, "loss_main": 0.525962233543396, "loss_parscale": 0.52734375, "loss_sub_dim": 0.268266886472702, "loss_vclub": 0.000904083251953125, "parscale_sim": 0.98828125, "step": 1255 }, { "epoch": 1.2030651340996168, "grad_norm": 6.81175422668457, "learning_rate": 1.9578947368421052e-06, "loss": 0.526, "step": 1256 }, { "epoch": 1.2030651340996168, "loss_full_dim": 0.2557185888290405, "loss_main": 0.5218034982681274, "loss_parscale": 0.5234375, "loss_sub_dim": 0.2660849392414093, "loss_vclub": 0.00091552734375, "parscale_sim": 0.984375, "step": 1256 }, { "epoch": 1.2040229885057472, "grad_norm": 6.1843791007995605, "learning_rate": 1.9552631578947372e-06, "loss": 0.5218, "step": 1257 }, { "epoch": 1.2040229885057472, "loss_full_dim": 0.29457080364227295, "loss_main": 0.602822482585907, "loss_parscale": 0.6171875, "loss_sub_dim": 0.30825167894363403, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.9765625, "step": 1257 }, { "epoch": 1.2049808429118773, "grad_norm": 7.067539215087891, "learning_rate": 1.9526315789473684e-06, "loss": 0.6028, "step": 1258 }, { "epoch": 1.2049808429118773, "loss_full_dim": 0.3061314821243286, "loss_main": 0.6256698369979858, "loss_parscale": 0.62890625, "loss_sub_dim": 0.31953832507133484, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.98828125, "step": 1258 }, { "epoch": 1.2059386973180077, "grad_norm": 6.367212295532227, "learning_rate": 1.9500000000000004e-06, "loss": 0.6257, "step": 1259 }, { "epoch": 1.2059386973180077, "loss_full_dim": 0.29022079706192017, "loss_main": 0.5936248302459717, "loss_parscale": 0.59375, "loss_sub_dim": 0.3034040331840515, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.98828125, "step": 1259 }, { "epoch": 1.206896551724138, "grad_norm": 7.527906894683838, "learning_rate": 1.9473684210526315e-06, "loss": 0.5936, "step": 1260 }, { "epoch": 1.206896551724138, "loss_full_dim": 0.25415581464767456, "loss_main": 0.520190954208374, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26603516936302185, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.98828125, "step": 1260 }, { "epoch": 1.2078544061302683, "grad_norm": 7.396082878112793, "learning_rate": 1.9447368421052636e-06, "loss": 0.5202, "step": 1261 }, { "epoch": 1.2078544061302683, "loss_full_dim": 0.2456897646188736, "loss_main": 0.5042834281921387, "loss_parscale": 0.515625, "loss_sub_dim": 0.25859367847442627, "loss_vclub": 0.00103759765625, "parscale_sim": 0.98828125, "step": 1261 }, { "epoch": 1.2088122605363985, "grad_norm": 8.166561126708984, "learning_rate": 1.9421052631578947e-06, "loss": 0.5043, "step": 1262 }, { "epoch": 1.2088122605363985, "loss_full_dim": 0.2871556878089905, "loss_main": 0.5877722501754761, "loss_parscale": 0.5859375, "loss_sub_dim": 0.3006165623664856, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.984375, "step": 1262 }, { "epoch": 1.2097701149425286, "grad_norm": 4.2421555519104, "learning_rate": 1.9394736842105263e-06, "loss": 0.5878, "step": 1263 }, { "epoch": 1.2097701149425286, "loss_full_dim": 0.29420119524002075, "loss_main": 0.6024352312088013, "loss_parscale": 0.6015625, "loss_sub_dim": 0.3082340657711029, "loss_vclub": 0.000858306884765625, "parscale_sim": 0.9765625, "step": 1263 }, { "epoch": 1.210727969348659, "grad_norm": 13.984384536743164, "learning_rate": 1.936842105263158e-06, "loss": 0.6024, "step": 1264 }, { "epoch": 1.210727969348659, "loss_full_dim": 0.32020464539527893, "loss_main": 0.6541991233825684, "loss_parscale": 0.66015625, "loss_sub_dim": 0.3339945077896118, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.984375, "step": 1264 }, { "epoch": 1.2116858237547894, "grad_norm": 12.05805492401123, "learning_rate": 1.9342105263157895e-06, "loss": 0.6542, "step": 1265 }, { "epoch": 1.2116858237547894, "loss_full_dim": 0.30263885855674744, "loss_main": 0.6184262037277222, "loss_parscale": 0.625, "loss_sub_dim": 0.31578731536865234, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.984375, "step": 1265 }, { "epoch": 1.2126436781609196, "grad_norm": 9.46151351928711, "learning_rate": 1.9315789473684215e-06, "loss": 0.6184, "step": 1266 }, { "epoch": 1.2126436781609196, "loss_full_dim": 0.2879517674446106, "loss_main": 0.5883126258850098, "loss_parscale": 0.58984375, "loss_sub_dim": 0.30036085844039917, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.96875, "step": 1266 }, { "epoch": 1.2136015325670497, "grad_norm": 7.991677761077881, "learning_rate": 1.9289473684210526e-06, "loss": 0.5883, "step": 1267 }, { "epoch": 1.2136015325670497, "loss_full_dim": 0.27160170674324036, "loss_main": 0.5541746020317078, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2825728952884674, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.98828125, "step": 1267 }, { "epoch": 1.21455938697318, "grad_norm": 9.327953338623047, "learning_rate": 1.9263157894736846e-06, "loss": 0.5542, "step": 1268 }, { "epoch": 1.21455938697318, "loss_full_dim": 0.37709373235702515, "loss_main": 0.7682386636734009, "loss_parscale": 0.76171875, "loss_sub_dim": 0.39114490151405334, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.9765625, "step": 1268 }, { "epoch": 1.2155172413793103, "grad_norm": 5.813579559326172, "learning_rate": 1.9236842105263158e-06, "loss": 0.7682, "step": 1269 }, { "epoch": 1.2155172413793103, "loss_full_dim": 0.24437730014324188, "loss_main": 0.4994892477989197, "loss_parscale": 0.49609375, "loss_sub_dim": 0.2551119327545166, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 1269 }, { "epoch": 1.2164750957854407, "grad_norm": 5.248595714569092, "learning_rate": 1.9210526315789474e-06, "loss": 0.4995, "step": 1270 }, { "epoch": 1.2164750957854407, "loss_full_dim": 0.2895762324333191, "loss_main": 0.5925171375274658, "loss_parscale": 0.58984375, "loss_sub_dim": 0.30294090509414673, "loss_vclub": 0.000827789306640625, "parscale_sim": 0.984375, "step": 1270 }, { "epoch": 1.2174329501915708, "grad_norm": 5.104273319244385, "learning_rate": 1.918421052631579e-06, "loss": 0.5925, "step": 1271 }, { "epoch": 1.2174329501915708, "loss_full_dim": 0.31891441345214844, "loss_main": 0.6496196985244751, "loss_parscale": 0.66015625, "loss_sub_dim": 0.33070528507232666, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.984375, "step": 1271 }, { "epoch": 1.2183908045977012, "grad_norm": 7.205747127532959, "learning_rate": 1.9157894736842105e-06, "loss": 0.6496, "step": 1272 }, { "epoch": 1.2183908045977012, "loss_full_dim": 0.2389478236436844, "loss_main": 0.48959940671920776, "loss_parscale": 0.49609375, "loss_sub_dim": 0.25065159797668457, "loss_vclub": 0.000888824462890625, "parscale_sim": 0.98828125, "step": 1272 }, { "epoch": 1.2193486590038314, "grad_norm": 7.696041584014893, "learning_rate": 1.9131578947368425e-06, "loss": 0.4896, "step": 1273 }, { "epoch": 1.2193486590038314, "loss_full_dim": 0.3078078031539917, "loss_main": 0.6286186575889587, "loss_parscale": 0.625, "loss_sub_dim": 0.32081085443496704, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.984375, "step": 1273 }, { "epoch": 1.2203065134099618, "grad_norm": 9.047403335571289, "learning_rate": 1.9105263157894737e-06, "loss": 0.6286, "step": 1274 }, { "epoch": 1.2203065134099618, "loss_full_dim": 0.2746238708496094, "loss_main": 0.5617977380752563, "loss_parscale": 0.56640625, "loss_sub_dim": 0.28717389702796936, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.984375, "step": 1274 }, { "epoch": 1.221264367816092, "grad_norm": 8.230570793151855, "learning_rate": 1.9078947368421057e-06, "loss": 0.5618, "step": 1275 }, { "epoch": 1.221264367816092, "loss_full_dim": 0.29168492555618286, "loss_main": 0.598721444606781, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30703651905059814, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.98828125, "step": 1275 }, { "epoch": 1.2222222222222223, "grad_norm": 7.35666561126709, "learning_rate": 1.905263157894737e-06, "loss": 0.5987, "step": 1276 }, { "epoch": 1.2222222222222223, "loss_full_dim": 0.28899407386779785, "loss_main": 0.5907653570175171, "loss_parscale": 0.59375, "loss_sub_dim": 0.3017713129520416, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.98828125, "step": 1276 }, { "epoch": 1.2231800766283525, "grad_norm": 8.296487808227539, "learning_rate": 1.9026315789473684e-06, "loss": 0.5908, "step": 1277 }, { "epoch": 1.2231800766283525, "loss_full_dim": 0.34392645955085754, "loss_main": 0.7012381553649902, "loss_parscale": 0.703125, "loss_sub_dim": 0.3573117256164551, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.98046875, "step": 1277 }, { "epoch": 1.2241379310344827, "grad_norm": 9.74915885925293, "learning_rate": 1.9000000000000002e-06, "loss": 0.7012, "step": 1278 }, { "epoch": 1.2241379310344827, "loss_full_dim": 0.30976366996765137, "loss_main": 0.6318866014480591, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3221229314804077, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.98828125, "step": 1278 }, { "epoch": 1.225095785440613, "grad_norm": 9.092549324035645, "learning_rate": 1.8973684210526316e-06, "loss": 0.6319, "step": 1279 }, { "epoch": 1.225095785440613, "loss_full_dim": 0.26804909110069275, "loss_main": 0.5488641262054443, "loss_parscale": 0.5546875, "loss_sub_dim": 0.280815064907074, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98828125, "step": 1279 }, { "epoch": 1.2260536398467432, "grad_norm": 4.381996154785156, "learning_rate": 1.8947368421052634e-06, "loss": 0.5489, "step": 1280 }, { "epoch": 1.2260536398467432, "loss_full_dim": 0.30271974205970764, "loss_main": 0.6175384521484375, "loss_parscale": 0.62109375, "loss_sub_dim": 0.31481873989105225, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.984375, "step": 1280 }, { "epoch": 1.2270114942528736, "grad_norm": 5.494359016418457, "learning_rate": 1.8921052631578948e-06, "loss": 0.6175, "step": 1281 }, { "epoch": 1.2270114942528736, "loss_full_dim": 0.25413304567337036, "loss_main": 0.5202577114105225, "loss_parscale": 0.53125, "loss_sub_dim": 0.2661246657371521, "loss_vclub": 0.000751495361328125, "parscale_sim": 0.97265625, "step": 1281 }, { "epoch": 1.2279693486590038, "grad_norm": 4.946822643280029, "learning_rate": 1.8894736842105266e-06, "loss": 0.5203, "step": 1282 }, { "epoch": 1.2279693486590038, "loss_full_dim": 0.29014867544174194, "loss_main": 0.591856062412262, "loss_parscale": 0.59765625, "loss_sub_dim": 0.30170738697052, "loss_vclub": 0.000904083251953125, "parscale_sim": 0.984375, "step": 1282 }, { "epoch": 1.2289272030651341, "grad_norm": 14.195136070251465, "learning_rate": 1.886842105263158e-06, "loss": 0.5919, "step": 1283 }, { "epoch": 1.2289272030651341, "loss_full_dim": 0.2775721549987793, "loss_main": 0.5707615613937378, "loss_parscale": 0.578125, "loss_sub_dim": 0.2931894063949585, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.984375, "step": 1283 }, { "epoch": 1.2298850574712643, "grad_norm": 8.373260498046875, "learning_rate": 1.8842105263157895e-06, "loss": 0.5708, "step": 1284 }, { "epoch": 1.2298850574712643, "loss_full_dim": 0.2785400450229645, "loss_main": 0.569911777973175, "loss_parscale": 0.5703125, "loss_sub_dim": 0.29137173295021057, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.98828125, "step": 1284 }, { "epoch": 1.2308429118773947, "grad_norm": 6.048569679260254, "learning_rate": 1.8815789473684213e-06, "loss": 0.5699, "step": 1285 }, { "epoch": 1.2308429118773947, "loss_full_dim": 0.2677006721496582, "loss_main": 0.5483510494232178, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2806503474712372, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98828125, "step": 1285 }, { "epoch": 1.2318007662835249, "grad_norm": 5.6308183670043945, "learning_rate": 1.8789473684210527e-06, "loss": 0.5484, "step": 1286 }, { "epoch": 1.2318007662835249, "loss_full_dim": 0.2622283399105072, "loss_main": 0.5351389646530151, "loss_parscale": 0.53125, "loss_sub_dim": 0.2729106545448303, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.984375, "step": 1286 }, { "epoch": 1.2327586206896552, "grad_norm": 8.173762321472168, "learning_rate": 1.8763157894736845e-06, "loss": 0.5351, "step": 1287 }, { "epoch": 1.2327586206896552, "loss_full_dim": 0.25770682096481323, "loss_main": 0.5284966826438904, "loss_parscale": 0.52734375, "loss_sub_dim": 0.27078986167907715, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.984375, "step": 1287 }, { "epoch": 1.2337164750957854, "grad_norm": 7.251173973083496, "learning_rate": 1.8736842105263158e-06, "loss": 0.5285, "step": 1288 }, { "epoch": 1.2337164750957854, "loss_full_dim": 0.2719252109527588, "loss_main": 0.5543222427368164, "loss_parscale": 0.5546875, "loss_sub_dim": 0.28239706158638, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.984375, "step": 1288 }, { "epoch": 1.2346743295019158, "grad_norm": 8.782171249389648, "learning_rate": 1.8710526315789476e-06, "loss": 0.5543, "step": 1289 }, { "epoch": 1.2346743295019158, "loss_full_dim": 0.27637678384780884, "loss_main": 0.5651393532752991, "loss_parscale": 0.56640625, "loss_sub_dim": 0.28876256942749023, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.98828125, "step": 1289 }, { "epoch": 1.235632183908046, "grad_norm": 5.903568267822266, "learning_rate": 1.868421052631579e-06, "loss": 0.5651, "step": 1290 }, { "epoch": 1.235632183908046, "loss_full_dim": 0.219927579164505, "loss_main": 0.4524696171283722, "loss_parscale": 0.45703125, "loss_sub_dim": 0.2325420379638672, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.984375, "step": 1290 }, { "epoch": 1.2365900383141764, "grad_norm": 15.335436820983887, "learning_rate": 1.8657894736842108e-06, "loss": 0.4525, "step": 1291 }, { "epoch": 1.2365900383141764, "loss_full_dim": 0.29998254776000977, "loss_main": 0.6152293682098389, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3152468204498291, "loss_vclub": 0.00091552734375, "parscale_sim": 0.984375, "step": 1291 }, { "epoch": 1.2375478927203065, "grad_norm": 8.228278160095215, "learning_rate": 1.8631578947368424e-06, "loss": 0.6152, "step": 1292 }, { "epoch": 1.2375478927203065, "loss_full_dim": 0.3000749945640564, "loss_main": 0.6131579279899597, "loss_parscale": 0.62109375, "loss_sub_dim": 0.3130829334259033, "loss_vclub": 0.00075531005859375, "parscale_sim": 0.98828125, "step": 1292 }, { "epoch": 1.2385057471264367, "grad_norm": 5.871972560882568, "learning_rate": 1.8605263157894737e-06, "loss": 0.6132, "step": 1293 }, { "epoch": 1.2385057471264367, "loss_full_dim": 0.3055157959461212, "loss_main": 0.6247552633285522, "loss_parscale": 0.62890625, "loss_sub_dim": 0.31923943758010864, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.98828125, "step": 1293 }, { "epoch": 1.239463601532567, "grad_norm": 8.646077156066895, "learning_rate": 1.8578947368421055e-06, "loss": 0.6248, "step": 1294 }, { "epoch": 1.239463601532567, "loss_full_dim": 0.2773681581020355, "loss_main": 0.5692466497421265, "loss_parscale": 0.578125, "loss_sub_dim": 0.29187846183776855, "loss_vclub": 0.001007080078125, "parscale_sim": 0.98046875, "step": 1294 }, { "epoch": 1.2404214559386972, "grad_norm": 7.795206546783447, "learning_rate": 1.855263157894737e-06, "loss": 0.5692, "step": 1295 }, { "epoch": 1.2404214559386972, "loss_full_dim": 0.32844266295433044, "loss_main": 0.6694017648696899, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3409591317176819, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1295 }, { "epoch": 1.2413793103448276, "grad_norm": 9.321011543273926, "learning_rate": 1.8526315789473687e-06, "loss": 0.6694, "step": 1296 }, { "epoch": 1.2413793103448276, "loss_full_dim": 0.28254997730255127, "loss_main": 0.5785168409347534, "loss_parscale": 0.578125, "loss_sub_dim": 0.29596689343452454, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.984375, "step": 1296 }, { "epoch": 1.2423371647509578, "grad_norm": 8.146695137023926, "learning_rate": 1.85e-06, "loss": 0.5785, "step": 1297 }, { "epoch": 1.2423371647509578, "loss_full_dim": 0.3094055950641632, "loss_main": 0.6309900283813477, "loss_parscale": 0.63671875, "loss_sub_dim": 0.32158446311950684, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 1297 }, { "epoch": 1.2432950191570882, "grad_norm": 8.73775577545166, "learning_rate": 1.8473684210526319e-06, "loss": 0.631, "step": 1298 }, { "epoch": 1.2432950191570882, "loss_full_dim": 0.2522459924221039, "loss_main": 0.5161575078964233, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26391154527664185, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.98828125, "step": 1298 }, { "epoch": 1.2442528735632183, "grad_norm": 6.351936340332031, "learning_rate": 1.8447368421052632e-06, "loss": 0.5162, "step": 1299 }, { "epoch": 1.2442528735632183, "loss_full_dim": 0.30646345019340515, "loss_main": 0.6275368928909302, "loss_parscale": 0.6328125, "loss_sub_dim": 0.321073442697525, "loss_vclub": 0.000885009765625, "parscale_sim": 0.98828125, "step": 1299 }, { "epoch": 1.2452107279693487, "grad_norm": 6.854035377502441, "learning_rate": 1.8421052631578948e-06, "loss": 0.6275, "step": 1300 }, { "epoch": 1.2452107279693487, "loss_full_dim": 0.30429521203041077, "loss_main": 0.6217790246009827, "loss_parscale": 0.62890625, "loss_sub_dim": 0.3174838125705719, "loss_vclub": 0.000827789306640625, "parscale_sim": 0.984375, "step": 1300 }, { "epoch": 1.246168582375479, "grad_norm": 4.220168113708496, "learning_rate": 1.8394736842105266e-06, "loss": 0.6218, "step": 1301 }, { "epoch": 1.246168582375479, "loss_full_dim": 0.29178282618522644, "loss_main": 0.5954152345657349, "loss_parscale": 0.59375, "loss_sub_dim": 0.3036324381828308, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.9765625, "step": 1301 }, { "epoch": 1.2471264367816093, "grad_norm": 6.315422534942627, "learning_rate": 1.836842105263158e-06, "loss": 0.5954, "step": 1302 }, { "epoch": 1.2471264367816093, "loss_full_dim": 0.2554935812950134, "loss_main": 0.5234264731407166, "loss_parscale": 0.53125, "loss_sub_dim": 0.2679328918457031, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98046875, "step": 1302 }, { "epoch": 1.2480842911877394, "grad_norm": 5.528379440307617, "learning_rate": 1.8342105263157898e-06, "loss": 0.5234, "step": 1303 }, { "epoch": 1.2480842911877394, "loss_full_dim": 0.28887802362442017, "loss_main": 0.5918742418289185, "loss_parscale": 0.59375, "loss_sub_dim": 0.3029962182044983, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.984375, "step": 1303 }, { "epoch": 1.2490421455938696, "grad_norm": 7.816915512084961, "learning_rate": 1.8315789473684211e-06, "loss": 0.5919, "step": 1304 }, { "epoch": 1.2490421455938696, "loss_full_dim": 0.270219624042511, "loss_main": 0.5529510378837585, "loss_parscale": 0.5546875, "loss_sub_dim": 0.28273141384124756, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.984375, "step": 1304 }, { "epoch": 1.25, "grad_norm": 5.8572468757629395, "learning_rate": 1.828947368421053e-06, "loss": 0.553, "step": 1305 }, { "epoch": 1.25, "loss_full_dim": 0.2857021391391754, "loss_main": 0.5834689140319824, "loss_parscale": 0.58984375, "loss_sub_dim": 0.2977667450904846, "loss_vclub": 0.000736236572265625, "parscale_sim": 0.98046875, "step": 1305 }, { "epoch": 1.2509578544061304, "grad_norm": 8.600815773010254, "learning_rate": 1.8263157894736843e-06, "loss": 0.5835, "step": 1306 }, { "epoch": 1.2509578544061304, "loss_full_dim": 0.2673030197620392, "loss_main": 0.5468466281890869, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2795436382293701, "loss_vclub": 0.000965118408203125, "parscale_sim": 0.98046875, "step": 1306 }, { "epoch": 1.2519157088122606, "grad_norm": 8.475868225097656, "learning_rate": 1.8236842105263159e-06, "loss": 0.5468, "step": 1307 }, { "epoch": 1.2519157088122606, "loss_full_dim": 0.23954838514328003, "loss_main": 0.4911397099494934, "loss_parscale": 0.50390625, "loss_sub_dim": 0.2515913248062134, "loss_vclub": 0.000675201416015625, "parscale_sim": 0.984375, "step": 1307 }, { "epoch": 1.2528735632183907, "grad_norm": 10.348819732666016, "learning_rate": 1.8210526315789475e-06, "loss": 0.4911, "step": 1308 }, { "epoch": 1.2528735632183907, "loss_full_dim": 0.28682637214660645, "loss_main": 0.5854896306991577, "loss_parscale": 0.578125, "loss_sub_dim": 0.29866325855255127, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.98828125, "step": 1308 }, { "epoch": 1.253831417624521, "grad_norm": 7.230132579803467, "learning_rate": 1.818421052631579e-06, "loss": 0.5855, "step": 1309 }, { "epoch": 1.253831417624521, "loss_full_dim": 0.2963903248310089, "loss_main": 0.6059867143630981, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3095964193344116, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.984375, "step": 1309 }, { "epoch": 1.2547892720306513, "grad_norm": 7.400805950164795, "learning_rate": 1.8157894736842109e-06, "loss": 0.606, "step": 1310 }, { "epoch": 1.2547892720306513, "loss_full_dim": 0.2818067967891693, "loss_main": 0.5775273442268372, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29572054743766785, "loss_vclub": 0.000743865966796875, "parscale_sim": 0.98828125, "step": 1310 }, { "epoch": 1.2557471264367817, "grad_norm": 6.080440998077393, "learning_rate": 1.8131578947368422e-06, "loss": 0.5775, "step": 1311 }, { "epoch": 1.2557471264367817, "loss_full_dim": 0.30504700541496277, "loss_main": 0.6221354007720947, "loss_parscale": 0.625, "loss_sub_dim": 0.31708836555480957, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.984375, "step": 1311 }, { "epoch": 1.2567049808429118, "grad_norm": 4.261111259460449, "learning_rate": 1.810526315789474e-06, "loss": 0.6221, "step": 1312 }, { "epoch": 1.2567049808429118, "loss_full_dim": 0.28362149000167847, "loss_main": 0.577678382396698, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29405689239501953, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.984375, "step": 1312 }, { "epoch": 1.2576628352490422, "grad_norm": 7.96189022064209, "learning_rate": 1.8078947368421054e-06, "loss": 0.5777, "step": 1313 }, { "epoch": 1.2576628352490422, "loss_full_dim": 0.31375545263290405, "loss_main": 0.6406230330467224, "loss_parscale": 0.640625, "loss_sub_dim": 0.32686758041381836, "loss_vclub": 0.000972747802734375, "parscale_sim": 0.98828125, "step": 1313 }, { "epoch": 1.2586206896551724, "grad_norm": 26.792333602905273, "learning_rate": 1.805263157894737e-06, "loss": 0.6406, "step": 1314 }, { "epoch": 1.2586206896551724, "loss_full_dim": 0.296190470457077, "loss_main": 0.6069326400756836, "loss_parscale": 0.61328125, "loss_sub_dim": 0.31074216961860657, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1314 }, { "epoch": 1.2595785440613028, "grad_norm": 5.835477352142334, "learning_rate": 1.8026315789473685e-06, "loss": 0.6069, "step": 1315 }, { "epoch": 1.2595785440613028, "loss_full_dim": 0.2709599435329437, "loss_main": 0.5544854402542114, "loss_parscale": 0.5625, "loss_sub_dim": 0.2835254669189453, "loss_vclub": 0.000896453857421875, "parscale_sim": 0.984375, "step": 1315 }, { "epoch": 1.260536398467433, "grad_norm": 11.13095474243164, "learning_rate": 1.8000000000000001e-06, "loss": 0.5545, "step": 1316 }, { "epoch": 1.260536398467433, "loss_full_dim": 0.2607796788215637, "loss_main": 0.5335643887519836, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2727847099304199, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.98046875, "step": 1316 }, { "epoch": 1.2614942528735633, "grad_norm": 5.811164379119873, "learning_rate": 1.7973684210526317e-06, "loss": 0.5336, "step": 1317 }, { "epoch": 1.2614942528735633, "loss_full_dim": 0.2676297426223755, "loss_main": 0.5485612154006958, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2809314727783203, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.98046875, "step": 1317 }, { "epoch": 1.2624521072796935, "grad_norm": 7.868773937225342, "learning_rate": 1.7947368421052633e-06, "loss": 0.5486, "step": 1318 }, { "epoch": 1.2624521072796935, "loss_full_dim": 0.28708869218826294, "loss_main": 0.5882853269577026, "loss_parscale": 0.59375, "loss_sub_dim": 0.3011966347694397, "loss_vclub": 0.0010528564453125, "parscale_sim": 0.98828125, "step": 1318 }, { "epoch": 1.2634099616858236, "grad_norm": 7.357295989990234, "learning_rate": 1.792105263157895e-06, "loss": 0.5883, "step": 1319 }, { "epoch": 1.2634099616858236, "loss_full_dim": 0.2709163427352905, "loss_main": 0.5513436198234558, "loss_parscale": 0.546875, "loss_sub_dim": 0.2804272770881653, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 1319 }, { "epoch": 1.264367816091954, "grad_norm": 6.547452926635742, "learning_rate": 1.7894736842105265e-06, "loss": 0.5513, "step": 1320 }, { "epoch": 1.264367816091954, "loss_full_dim": 0.33836615085601807, "loss_main": 0.6884469985961914, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3500808775424957, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.984375, "step": 1320 }, { "epoch": 1.2653256704980844, "grad_norm": 11.657613754272461, "learning_rate": 1.7868421052631578e-06, "loss": 0.6884, "step": 1321 }, { "epoch": 1.2653256704980844, "loss_full_dim": 0.3156396448612213, "loss_main": 0.6423545479774475, "loss_parscale": 0.640625, "loss_sub_dim": 0.3267149031162262, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.984375, "step": 1321 }, { "epoch": 1.2662835249042146, "grad_norm": 7.973985195159912, "learning_rate": 1.7842105263157896e-06, "loss": 0.6424, "step": 1322 }, { "epoch": 1.2662835249042146, "loss_full_dim": 0.30044132471084595, "loss_main": 0.6126442551612854, "loss_parscale": 0.625, "loss_sub_dim": 0.31220293045043945, "loss_vclub": 0.000946044921875, "parscale_sim": 0.98828125, "step": 1322 }, { "epoch": 1.2672413793103448, "grad_norm": 8.25383472442627, "learning_rate": 1.7815789473684212e-06, "loss": 0.6126, "step": 1323 }, { "epoch": 1.2672413793103448, "loss_full_dim": 0.27422666549682617, "loss_main": 0.5618752837181091, "loss_parscale": 0.5703125, "loss_sub_dim": 0.28764861822128296, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.984375, "step": 1323 }, { "epoch": 1.2681992337164751, "grad_norm": 5.424323081970215, "learning_rate": 1.7789473684210528e-06, "loss": 0.5619, "step": 1324 }, { "epoch": 1.2681992337164751, "loss_full_dim": 0.2465217411518097, "loss_main": 0.5028454065322876, "loss_parscale": 0.515625, "loss_sub_dim": 0.2563236951828003, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.98046875, "step": 1324 }, { "epoch": 1.2691570881226053, "grad_norm": 7.87506103515625, "learning_rate": 1.7763157894736844e-06, "loss": 0.5028, "step": 1325 }, { "epoch": 1.2691570881226053, "loss_full_dim": 0.25133654475212097, "loss_main": 0.5142462253570557, "loss_parscale": 0.515625, "loss_sub_dim": 0.2629096806049347, "loss_vclub": 0.0010528564453125, "parscale_sim": 0.98828125, "step": 1325 }, { "epoch": 1.2701149425287357, "grad_norm": 5.9688639640808105, "learning_rate": 1.7736842105263162e-06, "loss": 0.5142, "step": 1326 }, { "epoch": 1.2701149425287357, "loss_full_dim": 0.2832977771759033, "loss_main": 0.5810834169387817, "loss_parscale": 0.5859375, "loss_sub_dim": 0.2977856397628784, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.98828125, "step": 1326 }, { "epoch": 1.2710727969348659, "grad_norm": 19.495664596557617, "learning_rate": 1.7710526315789475e-06, "loss": 0.5811, "step": 1327 }, { "epoch": 1.2710727969348659, "loss_full_dim": 0.24065786600112915, "loss_main": 0.4913438558578491, "loss_parscale": 0.48828125, "loss_sub_dim": 0.25068598985671997, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.984375, "step": 1327 }, { "epoch": 1.2720306513409962, "grad_norm": 5.137777328491211, "learning_rate": 1.768421052631579e-06, "loss": 0.4913, "step": 1328 }, { "epoch": 1.2720306513409962, "loss_full_dim": 0.35013073682785034, "loss_main": 0.7129306793212891, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3627999722957611, "loss_vclub": 0.000820159912109375, "parscale_sim": 0.984375, "step": 1328 }, { "epoch": 1.2729885057471264, "grad_norm": 4.6097331047058105, "learning_rate": 1.7657894736842107e-06, "loss": 0.7129, "step": 1329 }, { "epoch": 1.2729885057471264, "loss_full_dim": 0.28156912326812744, "loss_main": 0.5770301818847656, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29546108841896057, "loss_vclub": 0.000827789306640625, "parscale_sim": 0.98046875, "step": 1329 }, { "epoch": 1.2739463601532566, "grad_norm": 15.848613739013672, "learning_rate": 1.7631578947368423e-06, "loss": 0.577, "step": 1330 }, { "epoch": 1.2739463601532566, "loss_full_dim": 0.2830670475959778, "loss_main": 0.5789777040481567, "loss_parscale": 0.578125, "loss_sub_dim": 0.29591062664985657, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.98046875, "step": 1330 }, { "epoch": 1.274904214559387, "grad_norm": 10.307331085205078, "learning_rate": 1.7605263157894739e-06, "loss": 0.579, "step": 1331 }, { "epoch": 1.274904214559387, "loss_full_dim": 0.3004641830921173, "loss_main": 0.6152150630950928, "loss_parscale": 0.61328125, "loss_sub_dim": 0.31475090980529785, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.984375, "step": 1331 }, { "epoch": 1.2758620689655173, "grad_norm": 7.474649906158447, "learning_rate": 1.7578947368421054e-06, "loss": 0.6152, "step": 1332 }, { "epoch": 1.2758620689655173, "loss_full_dim": 0.23783482611179352, "loss_main": 0.4874005913734436, "loss_parscale": 0.4921875, "loss_sub_dim": 0.24956578016281128, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.984375, "step": 1332 }, { "epoch": 1.2768199233716475, "grad_norm": 7.057280540466309, "learning_rate": 1.755263157894737e-06, "loss": 0.4874, "step": 1333 }, { "epoch": 1.2768199233716475, "loss_full_dim": 0.3027573227882385, "loss_main": 0.6179839372634888, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31522661447525024, "loss_vclub": 0.00091552734375, "parscale_sim": 0.9765625, "step": 1333 }, { "epoch": 1.2777777777777777, "grad_norm": 24.397789001464844, "learning_rate": 1.7526315789473686e-06, "loss": 0.618, "step": 1334 }, { "epoch": 1.2777777777777777, "loss_full_dim": 0.280997633934021, "loss_main": 0.5722306966781616, "loss_parscale": 0.57421875, "loss_sub_dim": 0.2912330627441406, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.98828125, "step": 1334 }, { "epoch": 1.278735632183908, "grad_norm": 7.9853386878967285, "learning_rate": 1.75e-06, "loss": 0.5722, "step": 1335 }, { "epoch": 1.278735632183908, "loss_full_dim": 0.27100932598114014, "loss_main": 0.553057849407196, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2820485234260559, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.9765625, "step": 1335 }, { "epoch": 1.2796934865900382, "grad_norm": 8.89769458770752, "learning_rate": 1.7473684210526318e-06, "loss": 0.5531, "step": 1336 }, { "epoch": 1.2796934865900382, "loss_full_dim": 0.25755006074905396, "loss_main": 0.5278024077415466, "loss_parscale": 0.53515625, "loss_sub_dim": 0.2702523469924927, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.984375, "step": 1336 }, { "epoch": 1.2806513409961686, "grad_norm": 7.3133955001831055, "learning_rate": 1.7447368421052631e-06, "loss": 0.5278, "step": 1337 }, { "epoch": 1.2806513409961686, "loss_full_dim": 0.23525211215019226, "loss_main": 0.4802888035774231, "loss_parscale": 0.48046875, "loss_sub_dim": 0.24503669142723083, "loss_vclub": 0.000896453857421875, "parscale_sim": 0.98828125, "step": 1337 }, { "epoch": 1.2816091954022988, "grad_norm": 6.486107349395752, "learning_rate": 1.742105263157895e-06, "loss": 0.4803, "step": 1338 }, { "epoch": 1.2816091954022988, "loss_full_dim": 0.27032485604286194, "loss_main": 0.5505756139755249, "loss_parscale": 0.55859375, "loss_sub_dim": 0.28025078773498535, "loss_vclub": 0.000942230224609375, "parscale_sim": 0.98828125, "step": 1338 }, { "epoch": 1.2825670498084292, "grad_norm": 9.264759063720703, "learning_rate": 1.7394736842105265e-06, "loss": 0.5506, "step": 1339 }, { "epoch": 1.2825670498084292, "loss_full_dim": 0.2955835163593292, "loss_main": 0.6046289205551147, "loss_parscale": 0.62109375, "loss_sub_dim": 0.3090454339981079, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98046875, "step": 1339 }, { "epoch": 1.2835249042145593, "grad_norm": 7.475778102874756, "learning_rate": 1.736842105263158e-06, "loss": 0.6046, "step": 1340 }, { "epoch": 1.2835249042145593, "loss_full_dim": 0.2880864143371582, "loss_main": 0.5874876976013184, "loss_parscale": 0.58203125, "loss_sub_dim": 0.29940125346183777, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.984375, "step": 1340 }, { "epoch": 1.2844827586206897, "grad_norm": 6.836956024169922, "learning_rate": 1.7342105263157897e-06, "loss": 0.5875, "step": 1341 }, { "epoch": 1.2844827586206897, "loss_full_dim": 0.2905111014842987, "loss_main": 0.5930262804031372, "loss_parscale": 0.59765625, "loss_sub_dim": 0.3025151789188385, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.984375, "step": 1341 }, { "epoch": 1.28544061302682, "grad_norm": 9.066161155700684, "learning_rate": 1.731578947368421e-06, "loss": 0.593, "step": 1342 }, { "epoch": 1.28544061302682, "loss_full_dim": 0.30420199036598206, "loss_main": 0.6207351684570312, "loss_parscale": 0.625, "loss_sub_dim": 0.3165332078933716, "loss_vclub": 0.000942230224609375, "parscale_sim": 0.984375, "step": 1342 }, { "epoch": 1.2863984674329503, "grad_norm": 5.454669952392578, "learning_rate": 1.7289473684210528e-06, "loss": 0.6207, "step": 1343 }, { "epoch": 1.2863984674329503, "loss_full_dim": 0.31935328245162964, "loss_main": 0.6527304649353027, "loss_parscale": 0.65625, "loss_sub_dim": 0.3333772122859955, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.984375, "step": 1343 }, { "epoch": 1.2873563218390804, "grad_norm": 7.801322937011719, "learning_rate": 1.7263157894736842e-06, "loss": 0.6527, "step": 1344 }, { "epoch": 1.2873563218390804, "loss_full_dim": 0.34992772340774536, "loss_main": 0.7119834423065186, "loss_parscale": 0.71875, "loss_sub_dim": 0.3620557188987732, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.984375, "step": 1344 }, { "epoch": 1.2883141762452106, "grad_norm": 8.426122665405273, "learning_rate": 1.723684210526316e-06, "loss": 0.712, "step": 1345 }, { "epoch": 1.2883141762452106, "loss_full_dim": 0.3171306550502777, "loss_main": 0.647231936454773, "loss_parscale": 0.65234375, "loss_sub_dim": 0.3301013112068176, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.984375, "step": 1345 }, { "epoch": 1.289272030651341, "grad_norm": 21.636857986450195, "learning_rate": 1.7210526315789474e-06, "loss": 0.6472, "step": 1346 }, { "epoch": 1.289272030651341, "loss_full_dim": 0.2728506624698639, "loss_main": 0.5572527647018433, "loss_parscale": 0.5546875, "loss_sub_dim": 0.28440213203430176, "loss_vclub": 0.0012969970703125, "parscale_sim": 0.984375, "step": 1346 }, { "epoch": 1.2902298850574714, "grad_norm": 8.428197860717773, "learning_rate": 1.7184210526315792e-06, "loss": 0.5573, "step": 1347 }, { "epoch": 1.2902298850574714, "loss_full_dim": 0.2510470747947693, "loss_main": 0.5151964426040649, "loss_parscale": 0.51171875, "loss_sub_dim": 0.26414939761161804, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.984375, "step": 1347 }, { "epoch": 1.2911877394636015, "grad_norm": 4.579853057861328, "learning_rate": 1.7157894736842107e-06, "loss": 0.5152, "step": 1348 }, { "epoch": 1.2911877394636015, "loss_full_dim": 0.27876734733581543, "loss_main": 0.5697875618934631, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2910202145576477, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.984375, "step": 1348 }, { "epoch": 1.2921455938697317, "grad_norm": 17.436372756958008, "learning_rate": 1.7131578947368421e-06, "loss": 0.5698, "step": 1349 }, { "epoch": 1.2921455938697317, "loss_full_dim": 0.2646292746067047, "loss_main": 0.5415854454040527, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2769562005996704, "loss_vclub": 0.000946044921875, "parscale_sim": 0.98828125, "step": 1349 }, { "epoch": 1.293103448275862, "grad_norm": 5.85814094543457, "learning_rate": 1.710526315789474e-06, "loss": 0.5416, "step": 1350 }, { "epoch": 1.293103448275862, "loss_full_dim": 0.3249732553958893, "loss_main": 0.6647764444351196, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33980315923690796, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.984375, "step": 1350 }, { "epoch": 1.2940613026819923, "grad_norm": 6.3976640701293945, "learning_rate": 1.7078947368421053e-06, "loss": 0.6648, "step": 1351 }, { "epoch": 1.2940613026819923, "loss_full_dim": 0.33320632576942444, "loss_main": 0.6803704500198364, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3471640944480896, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.984375, "step": 1351 }, { "epoch": 1.2950191570881227, "grad_norm": 7.872661590576172, "learning_rate": 1.705263157894737e-06, "loss": 0.6804, "step": 1352 }, { "epoch": 1.2950191570881227, "loss_full_dim": 0.2963508069515228, "loss_main": 0.6048550605773926, "loss_parscale": 0.60546875, "loss_sub_dim": 0.30850425362586975, "loss_vclub": 0.000957489013671875, "parscale_sim": 0.98828125, "step": 1352 }, { "epoch": 1.2959770114942528, "grad_norm": 5.708299160003662, "learning_rate": 1.7026315789473684e-06, "loss": 0.6049, "step": 1353 }, { "epoch": 1.2959770114942528, "loss_full_dim": 0.2768666744232178, "loss_main": 0.5675286054611206, "loss_parscale": 0.5703125, "loss_sub_dim": 0.29066193103790283, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.984375, "step": 1353 }, { "epoch": 1.2969348659003832, "grad_norm": 8.116795539855957, "learning_rate": 1.7000000000000002e-06, "loss": 0.5675, "step": 1354 }, { "epoch": 1.2969348659003832, "loss_full_dim": 0.3505675792694092, "loss_main": 0.7142130732536316, "loss_parscale": 0.7109375, "loss_sub_dim": 0.3636454939842224, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.984375, "step": 1354 }, { "epoch": 1.2978927203065134, "grad_norm": 7.4338297843933105, "learning_rate": 1.6973684210526318e-06, "loss": 0.7142, "step": 1355 }, { "epoch": 1.2978927203065134, "loss_full_dim": 0.32517391443252563, "loss_main": 0.6632260084152222, "loss_parscale": 0.66796875, "loss_sub_dim": 0.33805209398269653, "loss_vclub": 0.000946044921875, "parscale_sim": 0.984375, "step": 1355 }, { "epoch": 1.2988505747126438, "grad_norm": 9.334857940673828, "learning_rate": 1.6947368421052632e-06, "loss": 0.6632, "step": 1356 }, { "epoch": 1.2988505747126438, "loss_full_dim": 0.26482275128364563, "loss_main": 0.5436370968818665, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2788143455982208, "loss_vclub": 0.00109100341796875, "parscale_sim": 0.984375, "step": 1356 }, { "epoch": 1.299808429118774, "grad_norm": 9.345372200012207, "learning_rate": 1.692105263157895e-06, "loss": 0.5436, "step": 1357 }, { "epoch": 1.299808429118774, "loss_full_dim": 0.29967227578163147, "loss_main": 0.6160169839859009, "loss_parscale": 0.62890625, "loss_sub_dim": 0.316344678401947, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.984375, "step": 1357 }, { "epoch": 1.3007662835249043, "grad_norm": 9.04637336730957, "learning_rate": 1.6894736842105264e-06, "loss": 0.616, "step": 1358 }, { "epoch": 1.3007662835249043, "loss_full_dim": 0.28871050477027893, "loss_main": 0.5932683944702148, "loss_parscale": 0.6015625, "loss_sub_dim": 0.3045579195022583, "loss_vclub": 0.00107574462890625, "parscale_sim": 0.98046875, "step": 1358 }, { "epoch": 1.3017241379310345, "grad_norm": 10.360981941223145, "learning_rate": 1.6868421052631581e-06, "loss": 0.5933, "step": 1359 }, { "epoch": 1.3017241379310345, "loss_full_dim": 0.2836010158061981, "loss_main": 0.5790395736694336, "loss_parscale": 0.58203125, "loss_sub_dim": 0.2954385280609131, "loss_vclub": 0.0009765625, "parscale_sim": 0.98828125, "step": 1359 }, { "epoch": 1.3026819923371646, "grad_norm": 7.892270565032959, "learning_rate": 1.6842105263157895e-06, "loss": 0.579, "step": 1360 }, { "epoch": 1.3026819923371646, "loss_full_dim": 0.3291223347187042, "loss_main": 0.6707494854927063, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3416271507740021, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.984375, "step": 1360 }, { "epoch": 1.303639846743295, "grad_norm": 7.159830570220947, "learning_rate": 1.6815789473684213e-06, "loss": 0.6707, "step": 1361 }, { "epoch": 1.303639846743295, "loss_full_dim": 0.26496416330337524, "loss_main": 0.5415831208229065, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27661895751953125, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.984375, "step": 1361 }, { "epoch": 1.3045977011494254, "grad_norm": 6.0099568367004395, "learning_rate": 1.6789473684210527e-06, "loss": 0.5416, "step": 1362 }, { "epoch": 1.3045977011494254, "loss_full_dim": 0.2729203701019287, "loss_main": 0.5603217482566833, "loss_parscale": 0.55859375, "loss_sub_dim": 0.28740137815475464, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.98046875, "step": 1362 }, { "epoch": 1.3055555555555556, "grad_norm": 6.937341213226318, "learning_rate": 1.6763157894736843e-06, "loss": 0.5603, "step": 1363 }, { "epoch": 1.3055555555555556, "loss_full_dim": 0.29475924372673035, "loss_main": 0.6017845869064331, "loss_parscale": 0.609375, "loss_sub_dim": 0.30702534317970276, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.98046875, "step": 1363 }, { "epoch": 1.3065134099616857, "grad_norm": 5.906900882720947, "learning_rate": 1.673684210526316e-06, "loss": 0.6018, "step": 1364 }, { "epoch": 1.3065134099616857, "loss_full_dim": 0.25003528594970703, "loss_main": 0.515511691570282, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26547640562057495, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.98828125, "step": 1364 }, { "epoch": 1.3074712643678161, "grad_norm": 13.194698333740234, "learning_rate": 1.6710526315789474e-06, "loss": 0.5155, "step": 1365 }, { "epoch": 1.3074712643678161, "loss_full_dim": 0.31522855162620544, "loss_main": 0.6463280916213989, "loss_parscale": 0.65625, "loss_sub_dim": 0.33109956979751587, "loss_vclub": 0.0010528564453125, "parscale_sim": 0.98828125, "step": 1365 }, { "epoch": 1.3084291187739463, "grad_norm": 7.255568027496338, "learning_rate": 1.6684210526315792e-06, "loss": 0.6463, "step": 1366 }, { "epoch": 1.3084291187739463, "loss_full_dim": 0.30649468302726746, "loss_main": 0.6252375841140747, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31874293088912964, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.984375, "step": 1366 }, { "epoch": 1.3093869731800767, "grad_norm": 6.584646224975586, "learning_rate": 1.6657894736842106e-06, "loss": 0.6252, "step": 1367 }, { "epoch": 1.3093869731800767, "loss_full_dim": 0.3024881184101105, "loss_main": 0.621546745300293, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3190586268901825, "loss_vclub": 0.000957489013671875, "parscale_sim": 0.984375, "step": 1367 }, { "epoch": 1.3103448275862069, "grad_norm": 13.679372787475586, "learning_rate": 1.6631578947368424e-06, "loss": 0.6215, "step": 1368 }, { "epoch": 1.3103448275862069, "loss_full_dim": 0.2936478853225708, "loss_main": 0.6008739471435547, "loss_parscale": 0.60546875, "loss_sub_dim": 0.3072260916233063, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.984375, "step": 1368 }, { "epoch": 1.3113026819923372, "grad_norm": 6.726417541503906, "learning_rate": 1.6605263157894738e-06, "loss": 0.6009, "step": 1369 }, { "epoch": 1.3113026819923372, "loss_full_dim": 0.2371179163455963, "loss_main": 0.48659634590148926, "loss_parscale": 0.490234375, "loss_sub_dim": 0.24947841465473175, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.98046875, "step": 1369 }, { "epoch": 1.3122605363984674, "grad_norm": 7.782942295074463, "learning_rate": 1.6578947368421053e-06, "loss": 0.4866, "step": 1370 }, { "epoch": 1.3122605363984674, "loss_full_dim": 0.3094536364078522, "loss_main": 0.6329210996627808, "loss_parscale": 0.6484375, "loss_sub_dim": 0.3234674334526062, "loss_vclub": 0.0012054443359375, "parscale_sim": 0.984375, "step": 1370 }, { "epoch": 1.3132183908045976, "grad_norm": 12.27284049987793, "learning_rate": 1.655263157894737e-06, "loss": 0.6329, "step": 1371 }, { "epoch": 1.3132183908045976, "loss_full_dim": 0.2685330808162689, "loss_main": 0.5488983392715454, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2803652882575989, "loss_vclub": 0.0012359619140625, "parscale_sim": 0.98828125, "step": 1371 }, { "epoch": 1.314176245210728, "grad_norm": 138.82997131347656, "learning_rate": 1.6526315789473685e-06, "loss": 0.5489, "step": 1372 }, { "epoch": 1.314176245210728, "loss_full_dim": 0.25459128618240356, "loss_main": 0.5204910039901733, "loss_parscale": 0.5234375, "loss_sub_dim": 0.2658997178077698, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98828125, "step": 1372 }, { "epoch": 1.3151340996168583, "grad_norm": 7.027474403381348, "learning_rate": 1.6500000000000003e-06, "loss": 0.5205, "step": 1373 }, { "epoch": 1.3151340996168583, "loss_full_dim": 0.258207768201828, "loss_main": 0.5309864282608032, "loss_parscale": 0.53125, "loss_sub_dim": 0.27277863025665283, "loss_vclub": 0.00118255615234375, "parscale_sim": 0.98828125, "step": 1373 }, { "epoch": 1.3160919540229885, "grad_norm": 5.351786136627197, "learning_rate": 1.6473684210526317e-06, "loss": 0.531, "step": 1374 }, { "epoch": 1.3160919540229885, "loss_full_dim": 0.21989157795906067, "loss_main": 0.45063138008117676, "loss_parscale": 0.44921875, "loss_sub_dim": 0.2307398021221161, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.984375, "step": 1374 }, { "epoch": 1.3170498084291187, "grad_norm": 5.830430030822754, "learning_rate": 1.6447368421052635e-06, "loss": 0.4506, "step": 1375 }, { "epoch": 1.3170498084291187, "loss_full_dim": 0.2873387336730957, "loss_main": 0.5877772569656372, "loss_parscale": 0.5859375, "loss_sub_dim": 0.3004385232925415, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.96484375, "step": 1375 }, { "epoch": 1.318007662835249, "grad_norm": 10.228461265563965, "learning_rate": 1.6421052631578948e-06, "loss": 0.5878, "step": 1376 }, { "epoch": 1.318007662835249, "loss_full_dim": 0.31058773398399353, "loss_main": 0.6340237855911255, "loss_parscale": 0.625, "loss_sub_dim": 0.32343602180480957, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.98828125, "step": 1376 }, { "epoch": 1.3189655172413794, "grad_norm": 11.185540199279785, "learning_rate": 1.6394736842105264e-06, "loss": 0.634, "step": 1377 }, { "epoch": 1.3189655172413794, "loss_full_dim": 0.25797131657600403, "loss_main": 0.5303477048873901, "loss_parscale": 0.53515625, "loss_sub_dim": 0.2723763585090637, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1377 }, { "epoch": 1.3199233716475096, "grad_norm": 8.769050598144531, "learning_rate": 1.636842105263158e-06, "loss": 0.5303, "step": 1378 }, { "epoch": 1.3199233716475096, "loss_full_dim": 0.273465096950531, "loss_main": 0.5596481561660767, "loss_parscale": 0.56640625, "loss_sub_dim": 0.28618302941322327, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1378 }, { "epoch": 1.3208812260536398, "grad_norm": 4.97776985168457, "learning_rate": 1.6342105263157896e-06, "loss": 0.5596, "step": 1379 }, { "epoch": 1.3208812260536398, "loss_full_dim": 0.2503149211406708, "loss_main": 0.5148190259933472, "loss_parscale": 0.51953125, "loss_sub_dim": 0.264504075050354, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.984375, "step": 1379 }, { "epoch": 1.3218390804597702, "grad_norm": 6.7666497230529785, "learning_rate": 1.6315789473684212e-06, "loss": 0.5148, "step": 1380 }, { "epoch": 1.3218390804597702, "loss_full_dim": 0.3172864317893982, "loss_main": 0.649596631526947, "loss_parscale": 0.66015625, "loss_sub_dim": 0.33231019973754883, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.98046875, "step": 1380 }, { "epoch": 1.3227969348659003, "grad_norm": 60.22551727294922, "learning_rate": 1.6289473684210527e-06, "loss": 0.6496, "step": 1381 }, { "epoch": 1.3227969348659003, "loss_full_dim": 0.21017149090766907, "loss_main": 0.432351291179657, "loss_parscale": 0.439453125, "loss_sub_dim": 0.2221798151731491, "loss_vclub": 0.0009765625, "parscale_sim": 0.98828125, "step": 1381 }, { "epoch": 1.3237547892720307, "grad_norm": 4.190472602844238, "learning_rate": 1.6263157894736845e-06, "loss": 0.4324, "step": 1382 }, { "epoch": 1.3237547892720307, "loss_full_dim": 0.29878994822502136, "loss_main": 0.6129499673843384, "loss_parscale": 0.60546875, "loss_sub_dim": 0.3141600489616394, "loss_vclub": 0.000965118408203125, "parscale_sim": 0.984375, "step": 1382 }, { "epoch": 1.3247126436781609, "grad_norm": 6.0117998123168945, "learning_rate": 1.623684210526316e-06, "loss": 0.6129, "step": 1383 }, { "epoch": 1.3247126436781609, "loss_full_dim": 0.3298760950565338, "loss_main": 0.6757357120513916, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3458596467971802, "loss_vclub": 0.000850677490234375, "parscale_sim": 0.98046875, "step": 1383 }, { "epoch": 1.3256704980842913, "grad_norm": 9.467016220092773, "learning_rate": 1.6210526315789473e-06, "loss": 0.6757, "step": 1384 }, { "epoch": 1.3256704980842913, "loss_full_dim": 0.28850314021110535, "loss_main": 0.5884602665901184, "loss_parscale": 0.59375, "loss_sub_dim": 0.29995712637901306, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.984375, "step": 1384 }, { "epoch": 1.3266283524904214, "grad_norm": 20.35039520263672, "learning_rate": 1.618421052631579e-06, "loss": 0.5885, "step": 1385 }, { "epoch": 1.3266283524904214, "loss_full_dim": 0.25311753153800964, "loss_main": 0.5184799432754517, "loss_parscale": 0.515625, "loss_sub_dim": 0.26536238193511963, "loss_vclub": 0.000904083251953125, "parscale_sim": 0.98046875, "step": 1385 }, { "epoch": 1.3275862068965516, "grad_norm": 9.704333305358887, "learning_rate": 1.6157894736842106e-06, "loss": 0.5185, "step": 1386 }, { "epoch": 1.3275862068965516, "loss_full_dim": 0.26658716797828674, "loss_main": 0.5442478060722351, "loss_parscale": 0.54296875, "loss_sub_dim": 0.27766063809394836, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.984375, "step": 1386 }, { "epoch": 1.328544061302682, "grad_norm": 5.668735027313232, "learning_rate": 1.6131578947368422e-06, "loss": 0.5442, "step": 1387 }, { "epoch": 1.328544061302682, "loss_full_dim": 0.28328394889831543, "loss_main": 0.5785335302352905, "loss_parscale": 0.5859375, "loss_sub_dim": 0.2952495515346527, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.98046875, "step": 1387 }, { "epoch": 1.3295019157088124, "grad_norm": 6.452946186065674, "learning_rate": 1.6105263157894738e-06, "loss": 0.5785, "step": 1388 }, { "epoch": 1.3295019157088124, "loss_full_dim": 0.2981138229370117, "loss_main": 0.6109448671340942, "loss_parscale": 0.609375, "loss_sub_dim": 0.3128310441970825, "loss_vclub": 0.000885009765625, "parscale_sim": 0.98046875, "step": 1388 }, { "epoch": 1.3304597701149425, "grad_norm": 7.81870698928833, "learning_rate": 1.6078947368421056e-06, "loss": 0.6109, "step": 1389 }, { "epoch": 1.3304597701149425, "loss_full_dim": 0.26138296723365784, "loss_main": 0.5353184938430786, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27393555641174316, "loss_vclub": 0.0009765625, "parscale_sim": 0.984375, "step": 1389 }, { "epoch": 1.3314176245210727, "grad_norm": 18.784730911254883, "learning_rate": 1.605263157894737e-06, "loss": 0.5353, "step": 1390 }, { "epoch": 1.3314176245210727, "loss_full_dim": 0.2697572410106659, "loss_main": 0.5535567998886108, "loss_parscale": 0.546875, "loss_sub_dim": 0.28379958868026733, "loss_vclub": 0.000942230224609375, "parscale_sim": 0.97265625, "step": 1390 }, { "epoch": 1.332375478927203, "grad_norm": 16.503398895263672, "learning_rate": 1.6026315789473683e-06, "loss": 0.5536, "step": 1391 }, { "epoch": 1.332375478927203, "loss_full_dim": 0.24890229105949402, "loss_main": 0.5103331804275513, "loss_parscale": 0.51171875, "loss_sub_dim": 0.26143091917037964, "loss_vclub": 0.00121307373046875, "parscale_sim": 0.98828125, "step": 1391 }, { "epoch": 1.3333333333333333, "grad_norm": 5.324005603790283, "learning_rate": 1.6000000000000001e-06, "loss": 0.5103, "step": 1392 }, { "epoch": 1.3333333333333333, "loss_full_dim": 0.27816900610923767, "loss_main": 0.5677748918533325, "loss_parscale": 0.5703125, "loss_sub_dim": 0.28960591554641724, "loss_vclub": 0.000911712646484375, "parscale_sim": 0.984375, "step": 1392 }, { "epoch": 1.3342911877394636, "grad_norm": 49.14399719238281, "learning_rate": 1.5973684210526317e-06, "loss": 0.5678, "step": 1393 }, { "epoch": 1.3342911877394636, "loss_full_dim": 0.2882636785507202, "loss_main": 0.5896452069282532, "loss_parscale": 0.59375, "loss_sub_dim": 0.30138152837753296, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98046875, "step": 1393 }, { "epoch": 1.3352490421455938, "grad_norm": 116.46202087402344, "learning_rate": 1.5947368421052633e-06, "loss": 0.5896, "step": 1394 }, { "epoch": 1.3352490421455938, "loss_full_dim": 0.3069973886013031, "loss_main": 0.6272177696228027, "loss_parscale": 0.62890625, "loss_sub_dim": 0.32022035121917725, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98046875, "step": 1394 }, { "epoch": 1.3362068965517242, "grad_norm": 5.997342586517334, "learning_rate": 1.5921052631578949e-06, "loss": 0.6272, "step": 1395 }, { "epoch": 1.3362068965517242, "loss_full_dim": 0.2795782685279846, "loss_main": 0.5724254846572876, "loss_parscale": 0.578125, "loss_sub_dim": 0.292847216129303, "loss_vclub": 0.000885009765625, "parscale_sim": 0.9765625, "step": 1395 }, { "epoch": 1.3371647509578544, "grad_norm": 7.522037029266357, "learning_rate": 1.5894736842105265e-06, "loss": 0.5724, "step": 1396 }, { "epoch": 1.3371647509578544, "loss_full_dim": 0.25958728790283203, "loss_main": 0.5312973260879517, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27171000838279724, "loss_vclub": 0.00103759765625, "parscale_sim": 0.98828125, "step": 1396 }, { "epoch": 1.3381226053639848, "grad_norm": 5.68756103515625, "learning_rate": 1.586842105263158e-06, "loss": 0.5313, "step": 1397 }, { "epoch": 1.3381226053639848, "loss_full_dim": 0.2992541193962097, "loss_main": 0.6126993298530579, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31344521045684814, "loss_vclub": 0.000682830810546875, "parscale_sim": 0.984375, "step": 1397 }, { "epoch": 1.339080459770115, "grad_norm": 5.715951919555664, "learning_rate": 1.5842105263157894e-06, "loss": 0.6127, "step": 1398 }, { "epoch": 1.339080459770115, "loss_full_dim": 0.28944799304008484, "loss_main": 0.5912874341011047, "loss_parscale": 0.59765625, "loss_sub_dim": 0.3018394410610199, "loss_vclub": 0.000942230224609375, "parscale_sim": 0.98828125, "step": 1398 }, { "epoch": 1.3400383141762453, "grad_norm": 4.310550689697266, "learning_rate": 1.5815789473684212e-06, "loss": 0.5913, "step": 1399 }, { "epoch": 1.3400383141762453, "loss_full_dim": 0.24784140288829803, "loss_main": 0.5067541599273682, "loss_parscale": 0.51171875, "loss_sub_dim": 0.25891274213790894, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.9765625, "step": 1399 }, { "epoch": 1.3409961685823755, "grad_norm": 7.360272407531738, "learning_rate": 1.5789473684210526e-06, "loss": 0.5068, "step": 1400 }, { "epoch": 1.3409961685823755, "loss_full_dim": 0.3330940008163452, "loss_main": 0.6767317056655884, "loss_parscale": 0.67578125, "loss_sub_dim": 0.34363770484924316, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.984375, "step": 1400 }, { "epoch": 1.3419540229885056, "grad_norm": 7.922904968261719, "learning_rate": 1.5763157894736844e-06, "loss": 0.6767, "step": 1401 }, { "epoch": 1.3419540229885056, "loss_full_dim": 0.26061204075813293, "loss_main": 0.5336577892303467, "loss_parscale": 0.53125, "loss_sub_dim": 0.27304574847221375, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.98828125, "step": 1401 }, { "epoch": 1.342911877394636, "grad_norm": 8.50568962097168, "learning_rate": 1.573684210526316e-06, "loss": 0.5337, "step": 1402 }, { "epoch": 1.342911877394636, "loss_full_dim": 0.3215365409851074, "loss_main": 0.6584418416023254, "loss_parscale": 0.65625, "loss_sub_dim": 0.336905300617218, "loss_vclub": 0.000946044921875, "parscale_sim": 0.984375, "step": 1402 }, { "epoch": 1.3438697318007664, "grad_norm": 68.45893859863281, "learning_rate": 1.5710526315789475e-06, "loss": 0.6584, "step": 1403 }, { "epoch": 1.3438697318007664, "loss_full_dim": 0.3068680465221405, "loss_main": 0.6251933574676514, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31832534074783325, "loss_vclub": 0.000885009765625, "parscale_sim": 0.984375, "step": 1403 }, { "epoch": 1.3448275862068966, "grad_norm": 10.348437309265137, "learning_rate": 1.5684210526315791e-06, "loss": 0.6252, "step": 1404 }, { "epoch": 1.3448275862068966, "loss_full_dim": 0.27559924125671387, "loss_main": 0.5637133121490479, "loss_parscale": 0.5703125, "loss_sub_dim": 0.288114070892334, "loss_vclub": 0.000823974609375, "parscale_sim": 0.984375, "step": 1404 }, { "epoch": 1.3457854406130267, "grad_norm": 7.098781108856201, "learning_rate": 1.5657894736842105e-06, "loss": 0.5637, "step": 1405 }, { "epoch": 1.3457854406130267, "loss_full_dim": 0.2647462487220764, "loss_main": 0.5430606007575989, "loss_parscale": 0.5546875, "loss_sub_dim": 0.27831435203552246, "loss_vclub": 0.00103759765625, "parscale_sim": 0.984375, "step": 1405 }, { "epoch": 1.3467432950191571, "grad_norm": 9.702272415161133, "learning_rate": 1.5631578947368423e-06, "loss": 0.5431, "step": 1406 }, { "epoch": 1.3467432950191571, "loss_full_dim": 0.25064679980278015, "loss_main": 0.5138700008392334, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26322317123413086, "loss_vclub": 0.0009765625, "parscale_sim": 0.98046875, "step": 1406 }, { "epoch": 1.3477011494252873, "grad_norm": 5.545770645141602, "learning_rate": 1.5605263157894737e-06, "loss": 0.5139, "step": 1407 }, { "epoch": 1.3477011494252873, "loss_full_dim": 0.3019847571849823, "loss_main": 0.6150964498519897, "loss_parscale": 0.62109375, "loss_sub_dim": 0.31311172246932983, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.98046875, "step": 1407 }, { "epoch": 1.3486590038314177, "grad_norm": 6.2636823654174805, "learning_rate": 1.5578947368421054e-06, "loss": 0.6151, "step": 1408 }, { "epoch": 1.3486590038314177, "loss_full_dim": 0.2601128816604614, "loss_main": 0.5333535075187683, "loss_parscale": 0.546875, "loss_sub_dim": 0.2732406258583069, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.98828125, "step": 1408 }, { "epoch": 1.3496168582375478, "grad_norm": 8.161312103271484, "learning_rate": 1.5552631578947368e-06, "loss": 0.5334, "step": 1409 }, { "epoch": 1.3496168582375478, "loss_full_dim": 0.31044802069664, "loss_main": 0.6359328031539917, "loss_parscale": 0.64453125, "loss_sub_dim": 0.3254847526550293, "loss_vclub": 0.000762939453125, "parscale_sim": 0.9765625, "step": 1409 }, { "epoch": 1.3505747126436782, "grad_norm": 5.573994159698486, "learning_rate": 1.5526315789473686e-06, "loss": 0.6359, "step": 1410 }, { "epoch": 1.3505747126436782, "loss_full_dim": 0.2448892891407013, "loss_main": 0.5011206865310669, "loss_parscale": 0.50390625, "loss_sub_dim": 0.256231427192688, "loss_vclub": 0.00106048583984375, "parscale_sim": 0.98828125, "step": 1410 }, { "epoch": 1.3515325670498084, "grad_norm": 5.251748561859131, "learning_rate": 1.5500000000000002e-06, "loss": 0.5011, "step": 1411 }, { "epoch": 1.3515325670498084, "loss_full_dim": 0.2681443691253662, "loss_main": 0.5488423109054565, "loss_parscale": 0.55859375, "loss_sub_dim": 0.28069794178009033, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.984375, "step": 1411 }, { "epoch": 1.3524904214559386, "grad_norm": 17.743867874145508, "learning_rate": 1.5473684210526316e-06, "loss": 0.5488, "step": 1412 }, { "epoch": 1.3524904214559386, "loss_full_dim": 0.26781490445137024, "loss_main": 0.5475293397903442, "loss_parscale": 0.55078125, "loss_sub_dim": 0.2797144055366516, "loss_vclub": 0.001007080078125, "parscale_sim": 0.984375, "step": 1412 }, { "epoch": 1.353448275862069, "grad_norm": 8.322724342346191, "learning_rate": 1.5447368421052634e-06, "loss": 0.5475, "step": 1413 }, { "epoch": 1.353448275862069, "loss_full_dim": 0.2596686780452728, "loss_main": 0.5324405431747437, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27277183532714844, "loss_vclub": 0.000762939453125, "parscale_sim": 0.984375, "step": 1413 }, { "epoch": 1.3544061302681993, "grad_norm": 4.292129039764404, "learning_rate": 1.5421052631578947e-06, "loss": 0.5324, "step": 1414 }, { "epoch": 1.3544061302681993, "loss_full_dim": 0.21005436778068542, "loss_main": 0.4306059181690216, "loss_parscale": 0.4375, "loss_sub_dim": 0.22055155038833618, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1414 }, { "epoch": 1.3553639846743295, "grad_norm": 7.047054767608643, "learning_rate": 1.5394736842105265e-06, "loss": 0.4306, "step": 1415 }, { "epoch": 1.3553639846743295, "loss_full_dim": 0.2678617835044861, "loss_main": 0.5472501516342163, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2793883681297302, "loss_vclub": 0.001129150390625, "parscale_sim": 0.98828125, "step": 1415 }, { "epoch": 1.3563218390804597, "grad_norm": 5.5407891273498535, "learning_rate": 1.5368421052631579e-06, "loss": 0.5473, "step": 1416 }, { "epoch": 1.3563218390804597, "loss_full_dim": 0.26800256967544556, "loss_main": 0.546289324760437, "loss_parscale": 0.55859375, "loss_sub_dim": 0.27828675508499146, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1416 }, { "epoch": 1.35727969348659, "grad_norm": 6.60573148727417, "learning_rate": 1.5342105263157897e-06, "loss": 0.5463, "step": 1417 }, { "epoch": 1.35727969348659, "loss_full_dim": 0.328622430562973, "loss_main": 0.6692323684692383, "loss_parscale": 0.66796875, "loss_sub_dim": 0.34060990810394287, "loss_vclub": 0.00091552734375, "parscale_sim": 0.984375, "step": 1417 }, { "epoch": 1.3582375478927204, "grad_norm": 7.481311798095703, "learning_rate": 1.5315789473684213e-06, "loss": 0.6692, "step": 1418 }, { "epoch": 1.3582375478927204, "loss_full_dim": 0.28026261925697327, "loss_main": 0.5724532604217529, "loss_parscale": 0.56640625, "loss_sub_dim": 0.29219067096710205, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.98046875, "step": 1418 }, { "epoch": 1.3591954022988506, "grad_norm": 8.104726791381836, "learning_rate": 1.5289473684210526e-06, "loss": 0.5725, "step": 1419 }, { "epoch": 1.3591954022988506, "loss_full_dim": 0.2864629626274109, "loss_main": 0.5836079120635986, "loss_parscale": 0.59375, "loss_sub_dim": 0.29714494943618774, "loss_vclub": 0.0011138916015625, "parscale_sim": 0.984375, "step": 1419 }, { "epoch": 1.3601532567049808, "grad_norm": 7.007654190063477, "learning_rate": 1.5263157894736844e-06, "loss": 0.5836, "step": 1420 }, { "epoch": 1.3601532567049808, "loss_full_dim": 0.28261664509773254, "loss_main": 0.5778884887695312, "loss_parscale": 0.578125, "loss_sub_dim": 0.2952718734741211, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.984375, "step": 1420 }, { "epoch": 1.3611111111111112, "grad_norm": 7.774996757507324, "learning_rate": 1.5236842105263158e-06, "loss": 0.5779, "step": 1421 }, { "epoch": 1.3611111111111112, "loss_full_dim": 0.2942121922969818, "loss_main": 0.6023902893066406, "loss_parscale": 0.6015625, "loss_sub_dim": 0.3081781268119812, "loss_vclub": 0.00104522705078125, "parscale_sim": 0.98828125, "step": 1421 }, { "epoch": 1.3620689655172413, "grad_norm": 6.127841949462891, "learning_rate": 1.5210526315789476e-06, "loss": 0.6024, "step": 1422 }, { "epoch": 1.3620689655172413, "loss_full_dim": 0.2468608170747757, "loss_main": 0.5060372352600098, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2591764032840729, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98828125, "step": 1422 }, { "epoch": 1.3630268199233717, "grad_norm": 7.915132999420166, "learning_rate": 1.518421052631579e-06, "loss": 0.506, "step": 1423 }, { "epoch": 1.3630268199233717, "loss_full_dim": 0.3316683769226074, "loss_main": 0.6772264242172241, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3455580472946167, "loss_vclub": 0.000911712646484375, "parscale_sim": 0.98828125, "step": 1423 }, { "epoch": 1.3639846743295019, "grad_norm": 6.910118103027344, "learning_rate": 1.5157894736842108e-06, "loss": 0.6772, "step": 1424 }, { "epoch": 1.3639846743295019, "loss_full_dim": 0.32953375577926636, "loss_main": 0.671528697013855, "loss_parscale": 0.671875, "loss_sub_dim": 0.34199491143226624, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.98828125, "step": 1424 }, { "epoch": 1.3649425287356323, "grad_norm": 6.610849380493164, "learning_rate": 1.5131578947368421e-06, "loss": 0.6715, "step": 1425 }, { "epoch": 1.3649425287356323, "loss_full_dim": 0.3078840672969818, "loss_main": 0.6280884742736816, "loss_parscale": 0.6328125, "loss_sub_dim": 0.32020437717437744, "loss_vclub": 0.0010528564453125, "parscale_sim": 0.984375, "step": 1425 }, { "epoch": 1.3659003831417624, "grad_norm": 9.053065299987793, "learning_rate": 1.5105263157894737e-06, "loss": 0.6281, "step": 1426 }, { "epoch": 1.3659003831417624, "loss_full_dim": 0.26077723503112793, "loss_main": 0.5326447486877441, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2718675136566162, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.984375, "step": 1426 }, { "epoch": 1.3668582375478926, "grad_norm": 8.62873649597168, "learning_rate": 1.5078947368421055e-06, "loss": 0.5326, "step": 1427 }, { "epoch": 1.3668582375478926, "loss_full_dim": 0.2652833163738251, "loss_main": 0.541610836982727, "loss_parscale": 0.546875, "loss_sub_dim": 0.27632755041122437, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1427 }, { "epoch": 1.367816091954023, "grad_norm": 4.588911056518555, "learning_rate": 1.5052631578947369e-06, "loss": 0.5416, "step": 1428 }, { "epoch": 1.367816091954023, "loss_full_dim": 0.2513919770717621, "loss_main": 0.514276385307312, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26288437843322754, "loss_vclub": 0.00103759765625, "parscale_sim": 0.98046875, "step": 1428 }, { "epoch": 1.3687739463601534, "grad_norm": 8.470575332641602, "learning_rate": 1.5026315789473687e-06, "loss": 0.5143, "step": 1429 }, { "epoch": 1.3687739463601534, "loss_full_dim": 0.259309321641922, "loss_main": 0.5292825698852539, "loss_parscale": 0.53125, "loss_sub_dim": 0.2699732780456543, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98828125, "step": 1429 }, { "epoch": 1.3697318007662835, "grad_norm": 8.213982582092285, "learning_rate": 1.5e-06, "loss": 0.5293, "step": 1430 }, { "epoch": 1.3697318007662835, "loss_full_dim": 0.2752333879470825, "loss_main": 0.5616605281829834, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2864271402359009, "loss_vclub": 0.000774383544921875, "parscale_sim": 0.98046875, "step": 1430 }, { "epoch": 1.3706896551724137, "grad_norm": 7.089951038360596, "learning_rate": 1.4973684210526318e-06, "loss": 0.5617, "step": 1431 }, { "epoch": 1.3706896551724137, "loss_full_dim": 0.3035776615142822, "loss_main": 0.6200872659683228, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3165096044540405, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.984375, "step": 1431 }, { "epoch": 1.371647509578544, "grad_norm": 9.369475364685059, "learning_rate": 1.4947368421052632e-06, "loss": 0.6201, "step": 1432 }, { "epoch": 1.371647509578544, "loss_full_dim": 0.2865648865699768, "loss_main": 0.5849059820175171, "loss_parscale": 0.5859375, "loss_sub_dim": 0.2983410656452179, "loss_vclub": 0.000911712646484375, "parscale_sim": 0.98828125, "step": 1432 }, { "epoch": 1.3726053639846743, "grad_norm": 8.337563514709473, "learning_rate": 1.4921052631578948e-06, "loss": 0.5849, "step": 1433 }, { "epoch": 1.3726053639846743, "loss_full_dim": 0.23998737335205078, "loss_main": 0.49382656812667847, "loss_parscale": 0.48828125, "loss_sub_dim": 0.2538391947746277, "loss_vclub": 0.000911712646484375, "parscale_sim": 0.9609375, "step": 1433 }, { "epoch": 1.3735632183908046, "grad_norm": 6.613793849945068, "learning_rate": 1.4894736842105264e-06, "loss": 0.4938, "step": 1434 }, { "epoch": 1.3735632183908046, "loss_full_dim": 0.22732439637184143, "loss_main": 0.46627938747406006, "loss_parscale": 0.46875, "loss_sub_dim": 0.23895500600337982, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.984375, "step": 1434 }, { "epoch": 1.3745210727969348, "grad_norm": 7.078230857849121, "learning_rate": 1.486842105263158e-06, "loss": 0.4663, "step": 1435 }, { "epoch": 1.3745210727969348, "loss_full_dim": 0.31242093443870544, "loss_main": 0.6379152536392212, "loss_parscale": 0.64453125, "loss_sub_dim": 0.32549434900283813, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.98046875, "step": 1435 }, { "epoch": 1.3754789272030652, "grad_norm": 7.053311824798584, "learning_rate": 1.4842105263157897e-06, "loss": 0.6379, "step": 1436 }, { "epoch": 1.3754789272030652, "loss_full_dim": 0.2595037519931793, "loss_main": 0.5297878980636597, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27028417587280273, "loss_vclub": 0.000957489013671875, "parscale_sim": 0.98828125, "step": 1436 }, { "epoch": 1.3764367816091954, "grad_norm": 7.638769626617432, "learning_rate": 1.4815789473684211e-06, "loss": 0.5298, "step": 1437 }, { "epoch": 1.3764367816091954, "loss_full_dim": 0.3242509365081787, "loss_main": 0.6619527339935303, "loss_parscale": 0.66015625, "loss_sub_dim": 0.33770179748535156, "loss_vclub": 0.00091552734375, "parscale_sim": 0.984375, "step": 1437 }, { "epoch": 1.3773946360153257, "grad_norm": 8.022269248962402, "learning_rate": 1.478947368421053e-06, "loss": 0.662, "step": 1438 }, { "epoch": 1.3773946360153257, "loss_full_dim": 0.3254317343235016, "loss_main": 0.664404034614563, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3389723300933838, "loss_vclub": 0.000766754150390625, "parscale_sim": 0.98046875, "step": 1438 }, { "epoch": 1.378352490421456, "grad_norm": 8.837288856506348, "learning_rate": 1.4763157894736843e-06, "loss": 0.6644, "step": 1439 }, { "epoch": 1.378352490421456, "loss_full_dim": 0.2861782908439636, "loss_main": 0.5864044427871704, "loss_parscale": 0.59375, "loss_sub_dim": 0.3002261519432068, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.98828125, "step": 1439 }, { "epoch": 1.3793103448275863, "grad_norm": 9.61581039428711, "learning_rate": 1.4736842105263159e-06, "loss": 0.5864, "step": 1440 }, { "epoch": 1.3793103448275863, "loss_full_dim": 0.27857762575149536, "loss_main": 0.5733732581138611, "loss_parscale": 0.58203125, "loss_sub_dim": 0.2947956323623657, "loss_vclub": 0.000885009765625, "parscale_sim": 0.984375, "step": 1440 }, { "epoch": 1.3802681992337165, "grad_norm": 5.374157428741455, "learning_rate": 1.4710526315789474e-06, "loss": 0.5734, "step": 1441 }, { "epoch": 1.3802681992337165, "loss_full_dim": 0.2425311803817749, "loss_main": 0.4965578317642212, "loss_parscale": 0.49609375, "loss_sub_dim": 0.2540266513824463, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.98828125, "step": 1441 }, { "epoch": 1.3812260536398466, "grad_norm": 7.167741298675537, "learning_rate": 1.468421052631579e-06, "loss": 0.4966, "step": 1442 }, { "epoch": 1.3812260536398466, "loss_full_dim": 0.24236677587032318, "loss_main": 0.4966493844985962, "loss_parscale": 0.5, "loss_sub_dim": 0.2542826235294342, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.9765625, "step": 1442 }, { "epoch": 1.382183908045977, "grad_norm": 7.459336757659912, "learning_rate": 1.4657894736842106e-06, "loss": 0.4966, "step": 1443 }, { "epoch": 1.382183908045977, "loss_full_dim": 0.2197326421737671, "loss_main": 0.4485311508178711, "loss_parscale": 0.45703125, "loss_sub_dim": 0.228798508644104, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.98046875, "step": 1443 }, { "epoch": 1.3831417624521074, "grad_norm": 5.488800525665283, "learning_rate": 1.4631578947368422e-06, "loss": 0.4485, "step": 1444 }, { "epoch": 1.3831417624521074, "loss_full_dim": 0.23315317928791046, "loss_main": 0.47714805603027344, "loss_parscale": 0.48046875, "loss_sub_dim": 0.24399487674236298, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.984375, "step": 1444 }, { "epoch": 1.3840996168582376, "grad_norm": 8.004014015197754, "learning_rate": 1.460526315789474e-06, "loss": 0.4771, "step": 1445 }, { "epoch": 1.3840996168582376, "loss_full_dim": 0.27729532122612, "loss_main": 0.5671855211257935, "loss_parscale": 0.5703125, "loss_sub_dim": 0.28989022970199585, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1445 }, { "epoch": 1.3850574712643677, "grad_norm": 5.091665744781494, "learning_rate": 1.4578947368421053e-06, "loss": 0.5672, "step": 1446 }, { "epoch": 1.3850574712643677, "loss_full_dim": 0.2982071042060852, "loss_main": 0.6116952896118164, "loss_parscale": 0.62109375, "loss_sub_dim": 0.3134881556034088, "loss_vclub": 0.00116729736328125, "parscale_sim": 0.98828125, "step": 1446 }, { "epoch": 1.3860153256704981, "grad_norm": 6.97014045715332, "learning_rate": 1.4552631578947371e-06, "loss": 0.6117, "step": 1447 }, { "epoch": 1.3860153256704981, "loss_full_dim": 0.25122496485710144, "loss_main": 0.5156627893447876, "loss_parscale": 0.515625, "loss_sub_dim": 0.26443779468536377, "loss_vclub": 0.0010986328125, "parscale_sim": 0.984375, "step": 1447 }, { "epoch": 1.3869731800766283, "grad_norm": 3.1241614818573, "learning_rate": 1.4526315789473685e-06, "loss": 0.5157, "step": 1448 }, { "epoch": 1.3869731800766283, "loss_full_dim": 0.2580334544181824, "loss_main": 0.526891827583313, "loss_parscale": 0.5234375, "loss_sub_dim": 0.2688583731651306, "loss_vclub": 0.00074005126953125, "parscale_sim": 0.984375, "step": 1448 }, { "epoch": 1.3879310344827587, "grad_norm": 6.620814800262451, "learning_rate": 1.45e-06, "loss": 0.5269, "step": 1449 }, { "epoch": 1.3879310344827587, "loss_full_dim": 0.29191461205482483, "loss_main": 0.5964596271514893, "loss_parscale": 0.6015625, "loss_sub_dim": 0.3045450448989868, "loss_vclub": 0.00115966796875, "parscale_sim": 0.98046875, "step": 1449 }, { "epoch": 1.3888888888888888, "grad_norm": 10.294377326965332, "learning_rate": 1.4473684210526317e-06, "loss": 0.5965, "step": 1450 }, { "epoch": 1.3888888888888888, "loss_full_dim": 0.2957574725151062, "loss_main": 0.6049352884292603, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30917781591415405, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.98046875, "step": 1450 }, { "epoch": 1.3898467432950192, "grad_norm": 13.936260223388672, "learning_rate": 1.4447368421052633e-06, "loss": 0.6049, "step": 1451 }, { "epoch": 1.3898467432950192, "loss_full_dim": 0.30174171924591064, "loss_main": 0.6168468594551086, "loss_parscale": 0.61328125, "loss_sub_dim": 0.315105140209198, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.98046875, "step": 1451 }, { "epoch": 1.3908045977011494, "grad_norm": 8.148275375366211, "learning_rate": 1.442105263157895e-06, "loss": 0.6168, "step": 1452 }, { "epoch": 1.3908045977011494, "loss_full_dim": 0.3230585753917694, "loss_main": 0.6604815721511841, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3374229669570923, "loss_vclub": 0.0008544921875, "parscale_sim": 0.984375, "step": 1452 }, { "epoch": 1.3917624521072796, "grad_norm": 8.453217506408691, "learning_rate": 1.4394736842105264e-06, "loss": 0.6605, "step": 1453 }, { "epoch": 1.3917624521072796, "loss_full_dim": 0.306484192609787, "loss_main": 0.6254726648330688, "loss_parscale": 0.640625, "loss_sub_dim": 0.31898850202560425, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.984375, "step": 1453 }, { "epoch": 1.39272030651341, "grad_norm": 5.750580787658691, "learning_rate": 1.4368421052631582e-06, "loss": 0.6255, "step": 1454 }, { "epoch": 1.39272030651341, "loss_full_dim": 0.2634110152721405, "loss_main": 0.5398517847061157, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27644073963165283, "loss_vclub": 0.00091552734375, "parscale_sim": 0.9765625, "step": 1454 }, { "epoch": 1.3936781609195403, "grad_norm": 6.283159255981445, "learning_rate": 1.4342105263157896e-06, "loss": 0.5399, "step": 1455 }, { "epoch": 1.3936781609195403, "loss_full_dim": 0.2542641758918762, "loss_main": 0.5204920768737793, "loss_parscale": 0.515625, "loss_sub_dim": 0.2662279009819031, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98828125, "step": 1455 }, { "epoch": 1.3946360153256705, "grad_norm": 6.926137447357178, "learning_rate": 1.4315789473684212e-06, "loss": 0.5205, "step": 1456 }, { "epoch": 1.3946360153256705, "loss_full_dim": 0.33790823817253113, "loss_main": 0.6883993148803711, "loss_parscale": 0.6796875, "loss_sub_dim": 0.3504910469055176, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.984375, "step": 1456 }, { "epoch": 1.3955938697318007, "grad_norm": 7.689052104949951, "learning_rate": 1.4289473684210527e-06, "loss": 0.6884, "step": 1457 }, { "epoch": 1.3955938697318007, "loss_full_dim": 0.2621385455131531, "loss_main": 0.5384857058525085, "loss_parscale": 0.54296875, "loss_sub_dim": 0.27634716033935547, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.9765625, "step": 1457 }, { "epoch": 1.396551724137931, "grad_norm": 7.121740341186523, "learning_rate": 1.4263157894736843e-06, "loss": 0.5385, "step": 1458 }, { "epoch": 1.396551724137931, "loss_full_dim": 0.2846355140209198, "loss_main": 0.580682635307312, "loss_parscale": 0.5859375, "loss_sub_dim": 0.2960470914840698, "loss_vclub": 0.0009765625, "parscale_sim": 0.984375, "step": 1458 }, { "epoch": 1.3975095785440614, "grad_norm": 8.154653549194336, "learning_rate": 1.423684210526316e-06, "loss": 0.5807, "step": 1459 }, { "epoch": 1.3975095785440614, "loss_full_dim": 0.26376858353614807, "loss_main": 0.5387492179870605, "loss_parscale": 0.546875, "loss_sub_dim": 0.2749806046485901, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.984375, "step": 1459 }, { "epoch": 1.3984674329501916, "grad_norm": 5.934379577636719, "learning_rate": 1.4210526315789475e-06, "loss": 0.5387, "step": 1460 }, { "epoch": 1.3984674329501916, "loss_full_dim": 0.2675784230232239, "loss_main": 0.5477228760719299, "loss_parscale": 0.55078125, "loss_sub_dim": 0.28014445304870605, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.984375, "step": 1460 }, { "epoch": 1.3994252873563218, "grad_norm": 7.359752655029297, "learning_rate": 1.4184210526315793e-06, "loss": 0.5477, "step": 1461 }, { "epoch": 1.3994252873563218, "loss_full_dim": 0.3156362473964691, "loss_main": 0.642650842666626, "loss_parscale": 0.6484375, "loss_sub_dim": 0.32701462507247925, "loss_vclub": 0.00107574462890625, "parscale_sim": 0.984375, "step": 1461 }, { "epoch": 1.4003831417624522, "grad_norm": 6.922682762145996, "learning_rate": 1.4157894736842107e-06, "loss": 0.6427, "step": 1462 }, { "epoch": 1.4003831417624522, "loss_full_dim": 0.3073871433734894, "loss_main": 0.6280912756919861, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3207041323184967, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98828125, "step": 1462 }, { "epoch": 1.4013409961685823, "grad_norm": 6.743398189544678, "learning_rate": 1.413157894736842e-06, "loss": 0.6281, "step": 1463 }, { "epoch": 1.4013409961685823, "loss_full_dim": 0.22414742410182953, "loss_main": 0.46084314584732056, "loss_parscale": 0.46875, "loss_sub_dim": 0.23669573664665222, "loss_vclub": 0.001190185546875, "parscale_sim": 0.984375, "step": 1463 }, { "epoch": 1.4022988505747127, "grad_norm": 5.730963706970215, "learning_rate": 1.4105263157894738e-06, "loss": 0.4608, "step": 1464 }, { "epoch": 1.4022988505747127, "loss_full_dim": 0.28662970662117004, "loss_main": 0.585118293762207, "loss_parscale": 0.5859375, "loss_sub_dim": 0.2984886169433594, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.98046875, "step": 1464 }, { "epoch": 1.4032567049808429, "grad_norm": 6.718564987182617, "learning_rate": 1.4078947368421054e-06, "loss": 0.5851, "step": 1465 }, { "epoch": 1.4032567049808429, "loss_full_dim": 0.25508442521095276, "loss_main": 0.5202966928482056, "loss_parscale": 0.51953125, "loss_sub_dim": 0.2652122676372528, "loss_vclub": 0.00069427490234375, "parscale_sim": 0.98828125, "step": 1465 }, { "epoch": 1.4042145593869733, "grad_norm": 7.177119255065918, "learning_rate": 1.405263157894737e-06, "loss": 0.5203, "step": 1466 }, { "epoch": 1.4042145593869733, "loss_full_dim": 0.29322701692581177, "loss_main": 0.6011387705802917, "loss_parscale": 0.60546875, "loss_sub_dim": 0.30791175365448, "loss_vclub": 0.0009002685546875, "parscale_sim": 0.984375, "step": 1466 }, { "epoch": 1.4051724137931034, "grad_norm": 6.588516712188721, "learning_rate": 1.4026315789473686e-06, "loss": 0.6011, "step": 1467 }, { "epoch": 1.4051724137931034, "loss_full_dim": 0.2553558647632599, "loss_main": 0.5208282470703125, "loss_parscale": 0.53125, "loss_sub_dim": 0.2654723525047302, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.98046875, "step": 1467 }, { "epoch": 1.4061302681992336, "grad_norm": 4.383182525634766, "learning_rate": 1.4000000000000001e-06, "loss": 0.5208, "step": 1468 }, { "epoch": 1.4061302681992336, "loss_full_dim": 0.3099234104156494, "loss_main": 0.6325430870056152, "loss_parscale": 0.625, "loss_sub_dim": 0.32261964678764343, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.9765625, "step": 1468 }, { "epoch": 1.407088122605364, "grad_norm": 38.75847244262695, "learning_rate": 1.3973684210526317e-06, "loss": 0.6325, "step": 1469 }, { "epoch": 1.407088122605364, "loss_full_dim": 0.32179588079452515, "loss_main": 0.6546512246131897, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33285534381866455, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98046875, "step": 1469 }, { "epoch": 1.4080459770114944, "grad_norm": 10.84862995147705, "learning_rate": 1.394736842105263e-06, "loss": 0.6547, "step": 1470 }, { "epoch": 1.4080459770114944, "loss_full_dim": 0.2994224727153778, "loss_main": 0.6100900173187256, "loss_parscale": 0.61328125, "loss_sub_dim": 0.31066757440567017, "loss_vclub": 0.000827789306640625, "parscale_sim": 0.9609375, "step": 1470 }, { "epoch": 1.4090038314176245, "grad_norm": 4.688477039337158, "learning_rate": 1.3921052631578949e-06, "loss": 0.6101, "step": 1471 }, { "epoch": 1.4090038314176245, "loss_full_dim": 0.32779261469841003, "loss_main": 0.6683168411254883, "loss_parscale": 0.66796875, "loss_sub_dim": 0.34052419662475586, "loss_vclub": 0.0009002685546875, "parscale_sim": 0.984375, "step": 1471 }, { "epoch": 1.4099616858237547, "grad_norm": 7.635920524597168, "learning_rate": 1.3894736842105263e-06, "loss": 0.6683, "step": 1472 }, { "epoch": 1.4099616858237547, "loss_full_dim": 0.26717475056648254, "loss_main": 0.5468679666519165, "loss_parscale": 0.5546875, "loss_sub_dim": 0.27969324588775635, "loss_vclub": 0.000972747802734375, "parscale_sim": 0.984375, "step": 1472 }, { "epoch": 1.410919540229885, "grad_norm": 6.119555950164795, "learning_rate": 1.386842105263158e-06, "loss": 0.5469, "step": 1473 }, { "epoch": 1.410919540229885, "loss_full_dim": 0.23932358622550964, "loss_main": 0.4872093200683594, "loss_parscale": 0.494140625, "loss_sub_dim": 0.24788571894168854, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98046875, "step": 1473 }, { "epoch": 1.4118773946360152, "grad_norm": 6.9905619621276855, "learning_rate": 1.3842105263157896e-06, "loss": 0.4872, "step": 1474 }, { "epoch": 1.4118773946360152, "loss_full_dim": 0.30843424797058105, "loss_main": 0.6270670890808105, "loss_parscale": 0.625, "loss_sub_dim": 0.3186328411102295, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.984375, "step": 1474 }, { "epoch": 1.4128352490421456, "grad_norm": 6.837610244750977, "learning_rate": 1.3815789473684212e-06, "loss": 0.6271, "step": 1475 }, { "epoch": 1.4128352490421456, "loss_full_dim": 0.27881932258605957, "loss_main": 0.5699028968811035, "loss_parscale": 0.57421875, "loss_sub_dim": 0.29108354449272156, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.98828125, "step": 1475 }, { "epoch": 1.4137931034482758, "grad_norm": 7.498022079467773, "learning_rate": 1.3789473684210528e-06, "loss": 0.5699, "step": 1476 }, { "epoch": 1.4137931034482758, "loss_full_dim": 0.2748173475265503, "loss_main": 0.5602736473083496, "loss_parscale": 0.5625, "loss_sub_dim": 0.2854562997817993, "loss_vclub": 0.000904083251953125, "parscale_sim": 0.98828125, "step": 1476 }, { "epoch": 1.4147509578544062, "grad_norm": 8.380925178527832, "learning_rate": 1.3763157894736842e-06, "loss": 0.5603, "step": 1477 }, { "epoch": 1.4147509578544062, "loss_full_dim": 0.30592775344848633, "loss_main": 0.6245980262756348, "loss_parscale": 0.6328125, "loss_sub_dim": 0.31867027282714844, "loss_vclub": 0.00107574462890625, "parscale_sim": 0.984375, "step": 1477 }, { "epoch": 1.4157088122605364, "grad_norm": 8.696072578430176, "learning_rate": 1.373684210526316e-06, "loss": 0.6246, "step": 1478 }, { "epoch": 1.4157088122605364, "loss_full_dim": 0.2649526596069336, "loss_main": 0.5413990020751953, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2764463424682617, "loss_vclub": 0.001129150390625, "parscale_sim": 0.984375, "step": 1478 }, { "epoch": 1.4166666666666667, "grad_norm": 7.39325475692749, "learning_rate": 1.3710526315789473e-06, "loss": 0.5414, "step": 1479 }, { "epoch": 1.4166666666666667, "loss_full_dim": 0.3020321726799011, "loss_main": 0.6181992292404175, "loss_parscale": 0.62890625, "loss_sub_dim": 0.31616705656051636, "loss_vclub": 0.000942230224609375, "parscale_sim": 0.984375, "step": 1479 }, { "epoch": 1.417624521072797, "grad_norm": 9.418996810913086, "learning_rate": 1.3684210526315791e-06, "loss": 0.6182, "step": 1480 }, { "epoch": 1.417624521072797, "loss_full_dim": 0.2944619357585907, "loss_main": 0.6013553142547607, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30689337849617004, "loss_vclub": 0.00104522705078125, "parscale_sim": 0.984375, "step": 1480 }, { "epoch": 1.4185823754789273, "grad_norm": 6.891793727874756, "learning_rate": 1.3657894736842107e-06, "loss": 0.6014, "step": 1481 }, { "epoch": 1.4185823754789273, "loss_full_dim": 0.3396337926387787, "loss_main": 0.695358157157898, "loss_parscale": 0.69140625, "loss_sub_dim": 0.3557243347167969, "loss_vclub": 0.000942230224609375, "parscale_sim": 0.98046875, "step": 1481 }, { "epoch": 1.4195402298850575, "grad_norm": 7.158185958862305, "learning_rate": 1.3631578947368423e-06, "loss": 0.6954, "step": 1482 }, { "epoch": 1.4195402298850575, "loss_full_dim": 0.2553328573703766, "loss_main": 0.521722674369812, "loss_parscale": 0.52734375, "loss_sub_dim": 0.26638978719711304, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.98046875, "step": 1482 }, { "epoch": 1.4204980842911876, "grad_norm": 5.008781433105469, "learning_rate": 1.3605263157894739e-06, "loss": 0.5217, "step": 1483 }, { "epoch": 1.4204980842911876, "loss_full_dim": 0.3152264356613159, "loss_main": 0.6424081921577454, "loss_parscale": 0.640625, "loss_sub_dim": 0.32718175649642944, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.98828125, "step": 1483 }, { "epoch": 1.421455938697318, "grad_norm": 6.445954322814941, "learning_rate": 1.3578947368421052e-06, "loss": 0.6424, "step": 1484 }, { "epoch": 1.421455938697318, "loss_full_dim": 0.260742723941803, "loss_main": 0.5333617329597473, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27261900901794434, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98828125, "step": 1484 }, { "epoch": 1.4224137931034484, "grad_norm": 6.143900394439697, "learning_rate": 1.355263157894737e-06, "loss": 0.5334, "step": 1485 }, { "epoch": 1.4224137931034484, "loss_full_dim": 0.2978692650794983, "loss_main": 0.6073390245437622, "loss_parscale": 0.60546875, "loss_sub_dim": 0.3094697594642639, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.984375, "step": 1485 }, { "epoch": 1.4233716475095786, "grad_norm": 7.927254676818848, "learning_rate": 1.3526315789473684e-06, "loss": 0.6073, "step": 1486 }, { "epoch": 1.4233716475095786, "loss_full_dim": 0.32299312949180603, "loss_main": 0.6586132049560547, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33562010526657104, "loss_vclub": 0.0009765625, "parscale_sim": 0.98046875, "step": 1486 }, { "epoch": 1.4243295019157087, "grad_norm": 8.617494583129883, "learning_rate": 1.3500000000000002e-06, "loss": 0.6586, "step": 1487 }, { "epoch": 1.4243295019157087, "loss_full_dim": 0.30196696519851685, "loss_main": 0.6164339780807495, "loss_parscale": 0.609375, "loss_sub_dim": 0.3144669830799103, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98046875, "step": 1487 }, { "epoch": 1.4252873563218391, "grad_norm": 6.047404766082764, "learning_rate": 1.3473684210526316e-06, "loss": 0.6164, "step": 1488 }, { "epoch": 1.4252873563218391, "loss_full_dim": 0.2832612991333008, "loss_main": 0.5792470574378967, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29598575830459595, "loss_vclub": 0.0011138916015625, "parscale_sim": 0.984375, "step": 1488 }, { "epoch": 1.4262452107279693, "grad_norm": 6.2645416259765625, "learning_rate": 1.3447368421052634e-06, "loss": 0.5792, "step": 1489 }, { "epoch": 1.4262452107279693, "loss_full_dim": 0.26197922229766846, "loss_main": 0.5360660552978516, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2740868031978607, "loss_vclub": 0.000823974609375, "parscale_sim": 0.984375, "step": 1489 }, { "epoch": 1.4272030651340997, "grad_norm": 7.484915256500244, "learning_rate": 1.342105263157895e-06, "loss": 0.5361, "step": 1490 }, { "epoch": 1.4272030651340997, "loss_full_dim": 0.26681283116340637, "loss_main": 0.5469280481338501, "loss_parscale": 0.55078125, "loss_sub_dim": 0.28011518716812134, "loss_vclub": 0.00109100341796875, "parscale_sim": 0.98046875, "step": 1490 }, { "epoch": 1.4281609195402298, "grad_norm": 4.6334757804870605, "learning_rate": 1.3394736842105263e-06, "loss": 0.5469, "step": 1491 }, { "epoch": 1.4281609195402298, "loss_full_dim": 0.29488152265548706, "loss_main": 0.6005038619041443, "loss_parscale": 0.609375, "loss_sub_dim": 0.3056223392486572, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98828125, "step": 1491 }, { "epoch": 1.4291187739463602, "grad_norm": 8.596287727355957, "learning_rate": 1.3368421052631581e-06, "loss": 0.6005, "step": 1492 }, { "epoch": 1.4291187739463602, "loss_full_dim": 0.23419758677482605, "loss_main": 0.4795033931732178, "loss_parscale": 0.48046875, "loss_sub_dim": 0.24530580639839172, "loss_vclub": 0.0010986328125, "parscale_sim": 0.984375, "step": 1492 }, { "epoch": 1.4300766283524904, "grad_norm": 8.110608100891113, "learning_rate": 1.3342105263157895e-06, "loss": 0.4795, "step": 1493 }, { "epoch": 1.4300766283524904, "loss_full_dim": 0.30550646781921387, "loss_main": 0.6247362494468689, "loss_parscale": 0.62890625, "loss_sub_dim": 0.31922978162765503, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.98828125, "step": 1493 }, { "epoch": 1.4310344827586206, "grad_norm": 7.922787189483643, "learning_rate": 1.3315789473684213e-06, "loss": 0.6247, "step": 1494 }, { "epoch": 1.4310344827586206, "loss_full_dim": 0.2673156261444092, "loss_main": 0.5461773872375488, "loss_parscale": 0.55078125, "loss_sub_dim": 0.27886176109313965, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.984375, "step": 1494 }, { "epoch": 1.431992337164751, "grad_norm": 16.167774200439453, "learning_rate": 1.3289473684210526e-06, "loss": 0.5462, "step": 1495 }, { "epoch": 1.431992337164751, "loss_full_dim": 0.25967416167259216, "loss_main": 0.5313712358474731, "loss_parscale": 0.53125, "loss_sub_dim": 0.27169710397720337, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.984375, "step": 1495 }, { "epoch": 1.4329501915708813, "grad_norm": 6.099295139312744, "learning_rate": 1.3263157894736844e-06, "loss": 0.5314, "step": 1496 }, { "epoch": 1.4329501915708813, "loss_full_dim": 0.24360954761505127, "loss_main": 0.4976204037666321, "loss_parscale": 0.5, "loss_sub_dim": 0.2540108561515808, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.98828125, "step": 1496 }, { "epoch": 1.4339080459770115, "grad_norm": 8.169200897216797, "learning_rate": 1.3236842105263158e-06, "loss": 0.4976, "step": 1497 }, { "epoch": 1.4339080459770115, "loss_full_dim": 0.24349112808704376, "loss_main": 0.49998611211776733, "loss_parscale": 0.50390625, "loss_sub_dim": 0.25649499893188477, "loss_vclub": 0.0009765625, "parscale_sim": 0.98828125, "step": 1497 }, { "epoch": 1.4348659003831417, "grad_norm": 7.213562488555908, "learning_rate": 1.3210526315789474e-06, "loss": 0.5, "step": 1498 }, { "epoch": 1.4348659003831417, "loss_full_dim": 0.2805010676383972, "loss_main": 0.5740911364555359, "loss_parscale": 0.578125, "loss_sub_dim": 0.29359006881713867, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1498 }, { "epoch": 1.435823754789272, "grad_norm": 8.854147911071777, "learning_rate": 1.3184210526315792e-06, "loss": 0.5741, "step": 1499 }, { "epoch": 1.435823754789272, "loss_full_dim": 0.3289738595485687, "loss_main": 0.6696485280990601, "loss_parscale": 0.68359375, "loss_sub_dim": 0.34067463874816895, "loss_vclub": 0.00084686279296875, "parscale_sim": 0.984375, "step": 1499 }, { "epoch": 1.4367816091954024, "grad_norm": 7.318841457366943, "learning_rate": 1.3157894736842106e-06, "loss": 0.6696, "step": 1500 }, { "epoch": 1.4367816091954024, "loss_full_dim": 0.287507563829422, "loss_main": 0.5878767967224121, "loss_parscale": 0.578125, "loss_sub_dim": 0.3003692626953125, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.984375, "step": 1500 }, { "epoch": 1.4377394636015326, "grad_norm": 7.048236846923828, "learning_rate": 1.3131578947368423e-06, "loss": 0.5879, "step": 1501 }, { "epoch": 1.4377394636015326, "loss_full_dim": 0.3296479880809784, "loss_main": 0.6726342439651489, "loss_parscale": 0.671875, "loss_sub_dim": 0.34298622608184814, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.984375, "step": 1501 }, { "epoch": 1.4386973180076628, "grad_norm": 6.277939796447754, "learning_rate": 1.3105263157894737e-06, "loss": 0.6726, "step": 1502 }, { "epoch": 1.4386973180076628, "loss_full_dim": 0.24886251986026764, "loss_main": 0.5095056295394897, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2606431245803833, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 1502 }, { "epoch": 1.4396551724137931, "grad_norm": 5.635930061340332, "learning_rate": 1.3078947368421055e-06, "loss": 0.5095, "step": 1503 }, { "epoch": 1.4396551724137931, "loss_full_dim": 0.2869296669960022, "loss_main": 0.5857093334197998, "loss_parscale": 0.59375, "loss_sub_dim": 0.2987796664237976, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.98828125, "step": 1503 }, { "epoch": 1.4406130268199233, "grad_norm": 34.323665618896484, "learning_rate": 1.3052631578947369e-06, "loss": 0.5857, "step": 1504 }, { "epoch": 1.4406130268199233, "loss_full_dim": 0.25524255633354187, "loss_main": 0.5209113359451294, "loss_parscale": 0.53515625, "loss_sub_dim": 0.2656687796115875, "loss_vclub": 0.000885009765625, "parscale_sim": 0.984375, "step": 1504 }, { "epoch": 1.4415708812260537, "grad_norm": 8.08777141571045, "learning_rate": 1.3026315789473685e-06, "loss": 0.5209, "step": 1505 }, { "epoch": 1.4415708812260537, "loss_full_dim": 0.2816554307937622, "loss_main": 0.5748637318611145, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2932083010673523, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.984375, "step": 1505 }, { "epoch": 1.4425287356321839, "grad_norm": 4.2961745262146, "learning_rate": 1.3e-06, "loss": 0.5749, "step": 1506 }, { "epoch": 1.4425287356321839, "loss_full_dim": 0.3097201883792877, "loss_main": 0.6317927241325378, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3220725357532501, "loss_vclub": 0.000919342041015625, "parscale_sim": 0.9609375, "step": 1506 }, { "epoch": 1.4434865900383143, "grad_norm": 6.823925971984863, "learning_rate": 1.2973684210526316e-06, "loss": 0.6318, "step": 1507 }, { "epoch": 1.4434865900383143, "loss_full_dim": 0.22330324351787567, "loss_main": 0.4587704837322235, "loss_parscale": 0.46484375, "loss_sub_dim": 0.23546724021434784, "loss_vclub": 0.00104522705078125, "parscale_sim": 0.98828125, "step": 1507 }, { "epoch": 1.4444444444444444, "grad_norm": 5.374040126800537, "learning_rate": 1.2947368421052634e-06, "loss": 0.4588, "step": 1508 }, { "epoch": 1.4444444444444444, "loss_full_dim": 0.27110931277275085, "loss_main": 0.5558236837387085, "loss_parscale": 0.5546875, "loss_sub_dim": 0.28471437096595764, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.9765625, "step": 1508 }, { "epoch": 1.4454022988505746, "grad_norm": 8.247354507446289, "learning_rate": 1.2921052631578948e-06, "loss": 0.5558, "step": 1509 }, { "epoch": 1.4454022988505746, "loss_full_dim": 0.2116510272026062, "loss_main": 0.4349812865257263, "loss_parscale": 0.435546875, "loss_sub_dim": 0.22333025932312012, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.984375, "step": 1509 }, { "epoch": 1.446360153256705, "grad_norm": 4.642245292663574, "learning_rate": 1.2894736842105266e-06, "loss": 0.435, "step": 1510 }, { "epoch": 1.446360153256705, "loss_full_dim": 0.272015243768692, "loss_main": 0.5548412799835205, "loss_parscale": 0.5625, "loss_sub_dim": 0.2828260064125061, "loss_vclub": 0.0010528564453125, "parscale_sim": 0.984375, "step": 1510 }, { "epoch": 1.4473180076628354, "grad_norm": 8.682985305786133, "learning_rate": 1.286842105263158e-06, "loss": 0.5548, "step": 1511 }, { "epoch": 1.4473180076628354, "loss_full_dim": 0.25278154015541077, "loss_main": 0.5182821750640869, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26550060510635376, "loss_vclub": 0.000911712646484375, "parscale_sim": 0.984375, "step": 1511 }, { "epoch": 1.4482758620689655, "grad_norm": 7.592095375061035, "learning_rate": 1.2842105263157895e-06, "loss": 0.5183, "step": 1512 }, { "epoch": 1.4482758620689655, "loss_full_dim": 0.2518763840198517, "loss_main": 0.5165605545043945, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26468414068222046, "loss_vclub": 0.000888824462890625, "parscale_sim": 0.984375, "step": 1512 }, { "epoch": 1.4492337164750957, "grad_norm": 7.938193321228027, "learning_rate": 1.2815789473684211e-06, "loss": 0.5166, "step": 1513 }, { "epoch": 1.4492337164750957, "loss_full_dim": 0.2955598533153534, "loss_main": 0.6026208400726318, "loss_parscale": 0.6015625, "loss_sub_dim": 0.30706101655960083, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.984375, "step": 1513 }, { "epoch": 1.450191570881226, "grad_norm": 8.8136568069458, "learning_rate": 1.2789473684210527e-06, "loss": 0.6026, "step": 1514 }, { "epoch": 1.450191570881226, "loss_full_dim": 0.2481529265642166, "loss_main": 0.5087924003601074, "loss_parscale": 0.51171875, "loss_sub_dim": 0.260639488697052, "loss_vclub": 0.00103759765625, "parscale_sim": 0.98828125, "step": 1514 }, { "epoch": 1.4511494252873562, "grad_norm": 4.876161575317383, "learning_rate": 1.2763157894736845e-06, "loss": 0.5088, "step": 1515 }, { "epoch": 1.4511494252873562, "loss_full_dim": 0.28185999393463135, "loss_main": 0.5768401026725769, "loss_parscale": 0.5703125, "loss_sub_dim": 0.29498010873794556, "loss_vclub": 0.000946044921875, "parscale_sim": 0.96875, "step": 1515 }, { "epoch": 1.4521072796934866, "grad_norm": 8.5045747756958, "learning_rate": 1.2736842105263159e-06, "loss": 0.5768, "step": 1516 }, { "epoch": 1.4521072796934866, "loss_full_dim": 0.2816425859928131, "loss_main": 0.5755710601806641, "loss_parscale": 0.57421875, "loss_sub_dim": 0.29392850399017334, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1516 }, { "epoch": 1.4530651340996168, "grad_norm": 9.201456069946289, "learning_rate": 1.2710526315789477e-06, "loss": 0.5756, "step": 1517 }, { "epoch": 1.4530651340996168, "loss_full_dim": 0.28290316462516785, "loss_main": 0.5766828060150146, "loss_parscale": 0.578125, "loss_sub_dim": 0.2937796711921692, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.984375, "step": 1517 }, { "epoch": 1.4540229885057472, "grad_norm": 6.517994403839111, "learning_rate": 1.268421052631579e-06, "loss": 0.5767, "step": 1518 }, { "epoch": 1.4540229885057472, "loss_full_dim": 0.23997190594673157, "loss_main": 0.49339911341667175, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2534272074699402, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.98046875, "step": 1518 }, { "epoch": 1.4549808429118773, "grad_norm": 7.638847827911377, "learning_rate": 1.2657894736842106e-06, "loss": 0.4934, "step": 1519 }, { "epoch": 1.4549808429118773, "loss_full_dim": 0.3058415353298187, "loss_main": 0.62254399061203, "loss_parscale": 0.63671875, "loss_sub_dim": 0.3167024552822113, "loss_vclub": 0.000823974609375, "parscale_sim": 0.984375, "step": 1519 }, { "epoch": 1.4559386973180077, "grad_norm": 8.7429780960083, "learning_rate": 1.2631578947368422e-06, "loss": 0.6225, "step": 1520 }, { "epoch": 1.4559386973180077, "loss_full_dim": 0.274690181016922, "loss_main": 0.5604832172393799, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2857930660247803, "loss_vclub": 0.000881195068359375, "parscale_sim": 0.984375, "step": 1520 }, { "epoch": 1.456896551724138, "grad_norm": 5.984813690185547, "learning_rate": 1.2605263157894738e-06, "loss": 0.5605, "step": 1521 }, { "epoch": 1.456896551724138, "loss_full_dim": 0.257377564907074, "loss_main": 0.5251736640930176, "loss_parscale": 0.53125, "loss_sub_dim": 0.2677960991859436, "loss_vclub": 0.000946044921875, "parscale_sim": 0.9765625, "step": 1521 }, { "epoch": 1.4578544061302683, "grad_norm": 7.5676589012146, "learning_rate": 1.2578947368421054e-06, "loss": 0.5252, "step": 1522 }, { "epoch": 1.4578544061302683, "loss_full_dim": 0.26814764738082886, "loss_main": 0.5464603900909424, "loss_parscale": 0.546875, "loss_sub_dim": 0.2783127427101135, "loss_vclub": 0.000919342041015625, "parscale_sim": 0.984375, "step": 1522 }, { "epoch": 1.4588122605363985, "grad_norm": 7.1206464767456055, "learning_rate": 1.255263157894737e-06, "loss": 0.5465, "step": 1523 }, { "epoch": 1.4588122605363985, "loss_full_dim": 0.2786506116390228, "loss_main": 0.5694887638092041, "loss_parscale": 0.5703125, "loss_sub_dim": 0.29083818197250366, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.98046875, "step": 1523 }, { "epoch": 1.4597701149425286, "grad_norm": 6.397876262664795, "learning_rate": 1.2526315789473687e-06, "loss": 0.5695, "step": 1524 }, { "epoch": 1.4597701149425286, "loss_full_dim": 0.23366975784301758, "loss_main": 0.478184312582016, "loss_parscale": 0.478515625, "loss_sub_dim": 0.2445145547389984, "loss_vclub": 0.000957489013671875, "parscale_sim": 0.984375, "step": 1524 }, { "epoch": 1.460727969348659, "grad_norm": 5.347677707672119, "learning_rate": 1.25e-06, "loss": 0.4782, "step": 1525 }, { "epoch": 1.460727969348659, "loss_full_dim": 0.2687762975692749, "loss_main": 0.5496650338172913, "loss_parscale": 0.546875, "loss_sub_dim": 0.28088873624801636, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98046875, "step": 1525 }, { "epoch": 1.4616858237547894, "grad_norm": 6.684971332550049, "learning_rate": 1.2473684210526317e-06, "loss": 0.5497, "step": 1526 }, { "epoch": 1.4616858237547894, "loss_full_dim": 0.3208315670490265, "loss_main": 0.655392050743103, "loss_parscale": 0.65625, "loss_sub_dim": 0.33456048369407654, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.984375, "step": 1526 }, { "epoch": 1.4626436781609196, "grad_norm": 7.144434452056885, "learning_rate": 1.2447368421052633e-06, "loss": 0.6554, "step": 1527 }, { "epoch": 1.4626436781609196, "loss_full_dim": 0.30366969108581543, "loss_main": 0.6173754930496216, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31370580196380615, "loss_vclub": 0.00103759765625, "parscale_sim": 0.984375, "step": 1527 }, { "epoch": 1.4636015325670497, "grad_norm": 7.340268135070801, "learning_rate": 1.2421052631578948e-06, "loss": 0.6174, "step": 1528 }, { "epoch": 1.4636015325670497, "loss_full_dim": 0.3015812337398529, "loss_main": 0.6135411262512207, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3119598627090454, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.984375, "step": 1528 }, { "epoch": 1.46455938697318, "grad_norm": 10.399184226989746, "learning_rate": 1.2394736842105264e-06, "loss": 0.6135, "step": 1529 }, { "epoch": 1.46455938697318, "loss_full_dim": 0.294243186712265, "loss_main": 0.6001113653182983, "loss_parscale": 0.60546875, "loss_sub_dim": 0.3058681786060333, "loss_vclub": 0.000896453857421875, "parscale_sim": 0.984375, "step": 1529 }, { "epoch": 1.4655172413793103, "grad_norm": 7.7450432777404785, "learning_rate": 1.236842105263158e-06, "loss": 0.6001, "step": 1530 }, { "epoch": 1.4655172413793103, "loss_full_dim": 0.2162518948316574, "loss_main": 0.4432108998298645, "loss_parscale": 0.45703125, "loss_sub_dim": 0.2269589900970459, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.98828125, "step": 1530 }, { "epoch": 1.4664750957854407, "grad_norm": 7.039673328399658, "learning_rate": 1.2342105263157896e-06, "loss": 0.4432, "step": 1531 }, { "epoch": 1.4664750957854407, "loss_full_dim": 0.23247946798801422, "loss_main": 0.4744569659233093, "loss_parscale": 0.47265625, "loss_sub_dim": 0.2419774830341339, "loss_vclub": 0.001007080078125, "parscale_sim": 0.98828125, "step": 1531 }, { "epoch": 1.4674329501915708, "grad_norm": 8.252486228942871, "learning_rate": 1.2315789473684212e-06, "loss": 0.4745, "step": 1532 }, { "epoch": 1.4674329501915708, "loss_full_dim": 0.29890623688697815, "loss_main": 0.608609676361084, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3097034692764282, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.9765625, "step": 1532 }, { "epoch": 1.4683908045977012, "grad_norm": 8.720959663391113, "learning_rate": 1.2289473684210528e-06, "loss": 0.6086, "step": 1533 }, { "epoch": 1.4683908045977012, "loss_full_dim": 0.259144127368927, "loss_main": 0.5299093127250671, "loss_parscale": 0.53125, "loss_sub_dim": 0.27076518535614014, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.98828125, "step": 1533 }, { "epoch": 1.4693486590038314, "grad_norm": 6.237181186676025, "learning_rate": 1.2263157894736843e-06, "loss": 0.5299, "step": 1534 }, { "epoch": 1.4693486590038314, "loss_full_dim": 0.30565786361694336, "loss_main": 0.6246397495269775, "loss_parscale": 0.63671875, "loss_sub_dim": 0.3189818859100342, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.9765625, "step": 1534 }, { "epoch": 1.4703065134099618, "grad_norm": 8.427042961120605, "learning_rate": 1.223684210526316e-06, "loss": 0.6246, "step": 1535 }, { "epoch": 1.4703065134099618, "loss_full_dim": 0.2676406502723694, "loss_main": 0.5463684797286987, "loss_parscale": 0.5546875, "loss_sub_dim": 0.27872785925865173, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.984375, "step": 1535 }, { "epoch": 1.471264367816092, "grad_norm": 5.077229022979736, "learning_rate": 1.2210526315789475e-06, "loss": 0.5464, "step": 1536 }, { "epoch": 1.471264367816092, "loss_full_dim": 0.27956831455230713, "loss_main": 0.5736624002456665, "loss_parscale": 0.57421875, "loss_sub_dim": 0.2940940856933594, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.984375, "step": 1536 }, { "epoch": 1.4722222222222223, "grad_norm": 7.892132759094238, "learning_rate": 1.218421052631579e-06, "loss": 0.5737, "step": 1537 }, { "epoch": 1.4722222222222223, "loss_full_dim": 0.2711658477783203, "loss_main": 0.5519566535949707, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2807908058166504, "loss_vclub": 0.000762939453125, "parscale_sim": 0.984375, "step": 1537 }, { "epoch": 1.4731800766283525, "grad_norm": 9.02798080444336, "learning_rate": 1.2157894736842107e-06, "loss": 0.552, "step": 1538 }, { "epoch": 1.4731800766283525, "loss_full_dim": 0.28871357440948486, "loss_main": 0.5887461304664612, "loss_parscale": 0.58984375, "loss_sub_dim": 0.3000325560569763, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.984375, "step": 1538 }, { "epoch": 1.4741379310344827, "grad_norm": 6.387866497039795, "learning_rate": 1.2131578947368422e-06, "loss": 0.5887, "step": 1539 }, { "epoch": 1.4741379310344827, "loss_full_dim": 0.3297213912010193, "loss_main": 0.6713694930076599, "loss_parscale": 0.65625, "loss_sub_dim": 0.3416481018066406, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.96484375, "step": 1539 }, { "epoch": 1.475095785440613, "grad_norm": 6.775327205657959, "learning_rate": 1.2105263157894738e-06, "loss": 0.6714, "step": 1540 }, { "epoch": 1.475095785440613, "loss_full_dim": 0.2920832633972168, "loss_main": 0.5984621047973633, "loss_parscale": 0.60546875, "loss_sub_dim": 0.3063788414001465, "loss_vclub": 0.000888824462890625, "parscale_sim": 0.984375, "step": 1540 }, { "epoch": 1.4760536398467434, "grad_norm": 7.750859260559082, "learning_rate": 1.2078947368421054e-06, "loss": 0.5985, "step": 1541 }, { "epoch": 1.4760536398467434, "loss_full_dim": 0.280681312084198, "loss_main": 0.5732887983322144, "loss_parscale": 0.5703125, "loss_sub_dim": 0.29260748624801636, "loss_vclub": 0.000972747802734375, "parscale_sim": 0.96484375, "step": 1541 }, { "epoch": 1.4770114942528736, "grad_norm": 6.712161064147949, "learning_rate": 1.205263157894737e-06, "loss": 0.5733, "step": 1542 }, { "epoch": 1.4770114942528736, "loss_full_dim": 0.2494150847196579, "loss_main": 0.5084672570228577, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2590521574020386, "loss_vclub": 0.001007080078125, "parscale_sim": 0.984375, "step": 1542 }, { "epoch": 1.4779693486590038, "grad_norm": 6.276400089263916, "learning_rate": 1.2026315789473684e-06, "loss": 0.5085, "step": 1543 }, { "epoch": 1.4779693486590038, "loss_full_dim": 0.27058351039886475, "loss_main": 0.553539514541626, "loss_parscale": 0.5625, "loss_sub_dim": 0.28295600414276123, "loss_vclub": 0.00106048583984375, "parscale_sim": 0.984375, "step": 1543 }, { "epoch": 1.4789272030651341, "grad_norm": 6.2117438316345215, "learning_rate": 1.2000000000000002e-06, "loss": 0.5535, "step": 1544 }, { "epoch": 1.4789272030651341, "loss_full_dim": 0.2717023193836212, "loss_main": 0.5556834936141968, "loss_parscale": 0.5625, "loss_sub_dim": 0.28398117423057556, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1544 }, { "epoch": 1.4798850574712643, "grad_norm": 6.3779683113098145, "learning_rate": 1.1973684210526317e-06, "loss": 0.5557, "step": 1545 }, { "epoch": 1.4798850574712643, "loss_full_dim": 0.23468540608882904, "loss_main": 0.48183614015579224, "loss_parscale": 0.48046875, "loss_sub_dim": 0.2471507340669632, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.984375, "step": 1545 }, { "epoch": 1.4808429118773947, "grad_norm": 8.92759895324707, "learning_rate": 1.1947368421052633e-06, "loss": 0.4818, "step": 1546 }, { "epoch": 1.4808429118773947, "loss_full_dim": 0.26549750566482544, "loss_main": 0.5421966314315796, "loss_parscale": 0.546875, "loss_sub_dim": 0.27669912576675415, "loss_vclub": 0.001007080078125, "parscale_sim": 0.984375, "step": 1546 }, { "epoch": 1.4818007662835249, "grad_norm": 4.760114669799805, "learning_rate": 1.192105263157895e-06, "loss": 0.5422, "step": 1547 }, { "epoch": 1.4818007662835249, "loss_full_dim": 0.30371230840682983, "loss_main": 0.6183878779411316, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31467556953430176, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.98828125, "step": 1547 }, { "epoch": 1.4827586206896552, "grad_norm": 5.9211106300354, "learning_rate": 1.1894736842105265e-06, "loss": 0.6184, "step": 1548 }, { "epoch": 1.4827586206896552, "loss_full_dim": 0.25933748483657837, "loss_main": 0.5301872491836548, "loss_parscale": 0.53515625, "loss_sub_dim": 0.2708497643470764, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.98046875, "step": 1548 }, { "epoch": 1.4837164750957854, "grad_norm": 7.2861762046813965, "learning_rate": 1.186842105263158e-06, "loss": 0.5302, "step": 1549 }, { "epoch": 1.4837164750957854, "loss_full_dim": 0.2524327337741852, "loss_main": 0.5152053236961365, "loss_parscale": 0.515625, "loss_sub_dim": 0.2627725899219513, "loss_vclub": 0.00078582763671875, "parscale_sim": 0.98046875, "step": 1549 }, { "epoch": 1.4846743295019156, "grad_norm": 10.983405113220215, "learning_rate": 1.1842105263157894e-06, "loss": 0.5152, "step": 1550 }, { "epoch": 1.4846743295019156, "loss_full_dim": 0.2027130275964737, "loss_main": 0.41706550121307373, "loss_parscale": 0.41796875, "loss_sub_dim": 0.21435245871543884, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98046875, "step": 1550 }, { "epoch": 1.485632183908046, "grad_norm": 4.054431438446045, "learning_rate": 1.181578947368421e-06, "loss": 0.4171, "step": 1551 }, { "epoch": 1.485632183908046, "loss_full_dim": 0.29001927375793457, "loss_main": 0.589880108833313, "loss_parscale": 0.59375, "loss_sub_dim": 0.2998608350753784, "loss_vclub": 0.00106048583984375, "parscale_sim": 0.98828125, "step": 1551 }, { "epoch": 1.4865900383141764, "grad_norm": 7.120423793792725, "learning_rate": 1.1789473684210526e-06, "loss": 0.5899, "step": 1552 }, { "epoch": 1.4865900383141764, "loss_full_dim": 0.23596863448619843, "loss_main": 0.48258620500564575, "loss_parscale": 0.478515625, "loss_sub_dim": 0.24661757051944733, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.98046875, "step": 1552 }, { "epoch": 1.4875478927203065, "grad_norm": 5.959951400756836, "learning_rate": 1.1763157894736844e-06, "loss": 0.4826, "step": 1553 }, { "epoch": 1.4875478927203065, "loss_full_dim": 0.2280838042497635, "loss_main": 0.46731430292129517, "loss_parscale": 0.470703125, "loss_sub_dim": 0.23923051357269287, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.98046875, "step": 1553 }, { "epoch": 1.4885057471264367, "grad_norm": 6.9847002029418945, "learning_rate": 1.173684210526316e-06, "loss": 0.4673, "step": 1554 }, { "epoch": 1.4885057471264367, "loss_full_dim": 0.2977452278137207, "loss_main": 0.6074285507202148, "loss_parscale": 0.609375, "loss_sub_dim": 0.30968335270881653, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.984375, "step": 1554 }, { "epoch": 1.489463601532567, "grad_norm": 4.544293403625488, "learning_rate": 1.1710526315789476e-06, "loss": 0.6074, "step": 1555 }, { "epoch": 1.489463601532567, "loss_full_dim": 0.24296583235263824, "loss_main": 0.4954572916030884, "loss_parscale": 0.498046875, "loss_sub_dim": 0.25249144434928894, "loss_vclub": 0.0010986328125, "parscale_sim": 0.98828125, "step": 1555 }, { "epoch": 1.4904214559386972, "grad_norm": 6.624514579772949, "learning_rate": 1.1684210526315791e-06, "loss": 0.4955, "step": 1556 }, { "epoch": 1.4904214559386972, "loss_full_dim": 0.30470213294029236, "loss_main": 0.6221929788589478, "loss_parscale": 0.625, "loss_sub_dim": 0.3174908757209778, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1556 }, { "epoch": 1.4913793103448276, "grad_norm": 6.728792190551758, "learning_rate": 1.1657894736842105e-06, "loss": 0.6222, "step": 1557 }, { "epoch": 1.4913793103448276, "loss_full_dim": 0.2534218430519104, "loss_main": 0.5195683240890503, "loss_parscale": 0.53515625, "loss_sub_dim": 0.2661464810371399, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.984375, "step": 1557 }, { "epoch": 1.4923371647509578, "grad_norm": 6.928586959838867, "learning_rate": 1.163157894736842e-06, "loss": 0.5196, "step": 1558 }, { "epoch": 1.4923371647509578, "loss_full_dim": 0.2371552288532257, "loss_main": 0.4858822822570801, "loss_parscale": 0.490234375, "loss_sub_dim": 0.24872705340385437, "loss_vclub": 0.00091552734375, "parscale_sim": 0.98828125, "step": 1558 }, { "epoch": 1.4932950191570882, "grad_norm": 6.7881622314453125, "learning_rate": 1.1605263157894737e-06, "loss": 0.4859, "step": 1559 }, { "epoch": 1.4932950191570882, "loss_full_dim": 0.23259171843528748, "loss_main": 0.47459474205970764, "loss_parscale": 0.47265625, "loss_sub_dim": 0.24200302362442017, "loss_vclub": 0.00081634521484375, "parscale_sim": 0.984375, "step": 1559 }, { "epoch": 1.4942528735632183, "grad_norm": 7.585178375244141, "learning_rate": 1.1578947368421053e-06, "loss": 0.4746, "step": 1560 }, { "epoch": 1.4942528735632183, "loss_full_dim": 0.276476114988327, "loss_main": 0.5650969743728638, "loss_parscale": 0.5703125, "loss_sub_dim": 0.28862088918685913, "loss_vclub": 0.000946044921875, "parscale_sim": 0.984375, "step": 1560 }, { "epoch": 1.4952107279693487, "grad_norm": 7.856417179107666, "learning_rate": 1.155263157894737e-06, "loss": 0.5651, "step": 1561 }, { "epoch": 1.4952107279693487, "loss_full_dim": 0.2599063813686371, "loss_main": 0.5323008298873901, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27239444851875305, "loss_vclub": 0.000919342041015625, "parscale_sim": 0.984375, "step": 1561 }, { "epoch": 1.496168582375479, "grad_norm": 9.02015495300293, "learning_rate": 1.1526315789473686e-06, "loss": 0.5323, "step": 1562 }, { "epoch": 1.496168582375479, "loss_full_dim": 0.30725914239883423, "loss_main": 0.6284549832344055, "loss_parscale": 0.62890625, "loss_sub_dim": 0.3211958408355713, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98828125, "step": 1562 }, { "epoch": 1.4971264367816093, "grad_norm": 9.47971248626709, "learning_rate": 1.1500000000000002e-06, "loss": 0.6285, "step": 1563 }, { "epoch": 1.4971264367816093, "loss_full_dim": 0.26974019408226013, "loss_main": 0.5529787540435791, "loss_parscale": 0.55078125, "loss_sub_dim": 0.28323858976364136, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.98046875, "step": 1563 }, { "epoch": 1.4980842911877394, "grad_norm": 8.506958961486816, "learning_rate": 1.1473684210526316e-06, "loss": 0.553, "step": 1564 }, { "epoch": 1.4980842911877394, "loss_full_dim": 0.25857871770858765, "loss_main": 0.5283440947532654, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26976537704467773, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.984375, "step": 1564 }, { "epoch": 1.4990421455938696, "grad_norm": 7.485211372375488, "learning_rate": 1.1447368421052632e-06, "loss": 0.5283, "step": 1565 }, { "epoch": 1.4990421455938696, "loss_full_dim": 0.2564588487148285, "loss_main": 0.5235564112663269, "loss_parscale": 0.5234375, "loss_sub_dim": 0.2670975625514984, "loss_vclub": 0.000946044921875, "parscale_sim": 0.984375, "step": 1565 }, { "epoch": 1.5, "grad_norm": 6.1396284103393555, "learning_rate": 1.1421052631578947e-06, "loss": 0.5236, "step": 1566 }, { "epoch": 1.5, "loss_full_dim": 0.2790297865867615, "loss_main": 0.5706413388252258, "loss_parscale": 0.56640625, "loss_sub_dim": 0.29161155223846436, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.984375, "step": 1566 }, { "epoch": 1.5009578544061304, "grad_norm": 9.124783515930176, "learning_rate": 1.1394736842105263e-06, "loss": 0.5706, "step": 1567 }, { "epoch": 1.5009578544061304, "loss_full_dim": 0.2635965645313263, "loss_main": 0.5386325120925903, "loss_parscale": 0.546875, "loss_sub_dim": 0.27503594756126404, "loss_vclub": 0.000942230224609375, "parscale_sim": 0.98828125, "step": 1567 }, { "epoch": 1.5019157088122606, "grad_norm": 7.236045837402344, "learning_rate": 1.136842105263158e-06, "loss": 0.5386, "step": 1568 }, { "epoch": 1.5019157088122606, "loss_full_dim": 0.2641006112098694, "loss_main": 0.5388285517692566, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2747279405593872, "loss_vclub": 0.000812530517578125, "parscale_sim": 0.98828125, "step": 1568 }, { "epoch": 1.5028735632183907, "grad_norm": 7.839972972869873, "learning_rate": 1.1342105263157895e-06, "loss": 0.5388, "step": 1569 }, { "epoch": 1.5028735632183907, "loss_full_dim": 0.2845177948474884, "loss_main": 0.5802520513534546, "loss_parscale": 0.5859375, "loss_sub_dim": 0.2957342863082886, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.98828125, "step": 1569 }, { "epoch": 1.503831417624521, "grad_norm": 4.773136615753174, "learning_rate": 1.1315789473684213e-06, "loss": 0.5803, "step": 1570 }, { "epoch": 1.503831417624521, "loss_full_dim": 0.3266419768333435, "loss_main": 0.6681307554244995, "loss_parscale": 0.671875, "loss_sub_dim": 0.3414887487888336, "loss_vclub": 0.00072479248046875, "parscale_sim": 0.98046875, "step": 1570 }, { "epoch": 1.5047892720306515, "grad_norm": 9.4158353805542, "learning_rate": 1.1289473684210529e-06, "loss": 0.6681, "step": 1571 }, { "epoch": 1.5047892720306515, "loss_full_dim": 0.2679955065250397, "loss_main": 0.5461979508399963, "loss_parscale": 0.54296875, "loss_sub_dim": 0.27820244431495667, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.984375, "step": 1571 }, { "epoch": 1.5057471264367817, "grad_norm": 5.798795700073242, "learning_rate": 1.1263157894736842e-06, "loss": 0.5462, "step": 1572 }, { "epoch": 1.5057471264367817, "loss_full_dim": 0.2591155469417572, "loss_main": 0.5280858278274536, "loss_parscale": 0.53515625, "loss_sub_dim": 0.2689702808856964, "loss_vclub": 0.000946044921875, "parscale_sim": 0.984375, "step": 1572 }, { "epoch": 1.5067049808429118, "grad_norm": 9.392311096191406, "learning_rate": 1.1236842105263158e-06, "loss": 0.5281, "step": 1573 }, { "epoch": 1.5067049808429118, "loss_full_dim": 0.2735786736011505, "loss_main": 0.5596981048583984, "loss_parscale": 0.5625, "loss_sub_dim": 0.28611940145492554, "loss_vclub": 0.00103759765625, "parscale_sim": 0.984375, "step": 1573 }, { "epoch": 1.5076628352490422, "grad_norm": 19.735437393188477, "learning_rate": 1.1210526315789474e-06, "loss": 0.5597, "step": 1574 }, { "epoch": 1.5076628352490422, "loss_full_dim": 0.24710938334465027, "loss_main": 0.5037733316421509, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2566639184951782, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.98046875, "step": 1574 }, { "epoch": 1.5086206896551724, "grad_norm": 6.7458696365356445, "learning_rate": 1.118421052631579e-06, "loss": 0.5038, "step": 1575 }, { "epoch": 1.5086206896551724, "loss_full_dim": 0.23704536259174347, "loss_main": 0.4864211678504944, "loss_parscale": 0.482421875, "loss_sub_dim": 0.24937579035758972, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.98828125, "step": 1575 }, { "epoch": 1.5095785440613025, "grad_norm": 6.34112024307251, "learning_rate": 1.1157894736842106e-06, "loss": 0.4864, "step": 1576 }, { "epoch": 1.5095785440613025, "loss_full_dim": 0.28337907791137695, "loss_main": 0.5786964297294617, "loss_parscale": 0.578125, "loss_sub_dim": 0.2953173518180847, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98046875, "step": 1576 }, { "epoch": 1.510536398467433, "grad_norm": 8.49710750579834, "learning_rate": 1.1131578947368421e-06, "loss": 0.5787, "step": 1577 }, { "epoch": 1.510536398467433, "loss_full_dim": 0.24742473661899567, "loss_main": 0.505791962146759, "loss_parscale": 0.5234375, "loss_sub_dim": 0.2583672106266022, "loss_vclub": 0.00106048583984375, "parscale_sim": 0.98828125, "step": 1577 }, { "epoch": 1.5114942528735633, "grad_norm": 8.188737869262695, "learning_rate": 1.110526315789474e-06, "loss": 0.5058, "step": 1578 }, { "epoch": 1.5114942528735633, "loss_full_dim": 0.25804299116134644, "loss_main": 0.5265523195266724, "loss_parscale": 0.52734375, "loss_sub_dim": 0.2685093581676483, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.98046875, "step": 1578 }, { "epoch": 1.5124521072796935, "grad_norm": 4.510198593139648, "learning_rate": 1.1078947368421053e-06, "loss": 0.5266, "step": 1579 }, { "epoch": 1.5124521072796935, "loss_full_dim": 0.23181921243667603, "loss_main": 0.4761497974395752, "loss_parscale": 0.48046875, "loss_sub_dim": 0.24433059990406036, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98046875, "step": 1579 }, { "epoch": 1.5134099616858236, "grad_norm": 6.469951629638672, "learning_rate": 1.1052631578947369e-06, "loss": 0.4761, "step": 1580 }, { "epoch": 1.5134099616858236, "loss_full_dim": 0.2433459609746933, "loss_main": 0.4980982542037964, "loss_parscale": 0.494140625, "loss_sub_dim": 0.2547522783279419, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.98046875, "step": 1580 }, { "epoch": 1.514367816091954, "grad_norm": 10.283929824829102, "learning_rate": 1.1026315789473685e-06, "loss": 0.4981, "step": 1581 }, { "epoch": 1.514367816091954, "loss_full_dim": 0.3284716010093689, "loss_main": 0.6703755259513855, "loss_parscale": 0.66796875, "loss_sub_dim": 0.3419039249420166, "loss_vclub": 0.001068115234375, "parscale_sim": 0.96875, "step": 1581 }, { "epoch": 1.5153256704980844, "grad_norm": 9.125419616699219, "learning_rate": 1.1e-06, "loss": 0.6704, "step": 1582 }, { "epoch": 1.5153256704980844, "loss_full_dim": 0.24836961925029755, "loss_main": 0.5081508755683899, "loss_parscale": 0.50390625, "loss_sub_dim": 0.25978124141693115, "loss_vclub": 0.00106048583984375, "parscale_sim": 0.984375, "step": 1582 }, { "epoch": 1.5162835249042146, "grad_norm": 15.676124572753906, "learning_rate": 1.0973684210526316e-06, "loss": 0.5082, "step": 1583 }, { "epoch": 1.5162835249042146, "loss_full_dim": 0.2319272756576538, "loss_main": 0.47537505626678467, "loss_parscale": 0.478515625, "loss_sub_dim": 0.24344778060913086, "loss_vclub": 0.00079345703125, "parscale_sim": 0.984375, "step": 1583 }, { "epoch": 1.5172413793103448, "grad_norm": 7.495913028717041, "learning_rate": 1.0947368421052632e-06, "loss": 0.4754, "step": 1584 }, { "epoch": 1.5172413793103448, "loss_full_dim": 0.25196415185928345, "loss_main": 0.5168355107307434, "loss_parscale": 0.51953125, "loss_sub_dim": 0.26487135887145996, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 1584 }, { "epoch": 1.5181992337164751, "grad_norm": 5.981796741485596, "learning_rate": 1.0921052631578948e-06, "loss": 0.5168, "step": 1585 }, { "epoch": 1.5181992337164751, "loss_full_dim": 0.27404290437698364, "loss_main": 0.5574386715888977, "loss_parscale": 0.5546875, "loss_sub_dim": 0.28339576721191406, "loss_vclub": 0.00067901611328125, "parscale_sim": 0.9765625, "step": 1585 }, { "epoch": 1.5191570881226055, "grad_norm": 6.641780853271484, "learning_rate": 1.0894736842105264e-06, "loss": 0.5574, "step": 1586 }, { "epoch": 1.5191570881226055, "loss_full_dim": 0.2821393609046936, "loss_main": 0.5760588645935059, "loss_parscale": 0.5703125, "loss_sub_dim": 0.29391950368881226, "loss_vclub": 0.000972747802734375, "parscale_sim": 0.98828125, "step": 1586 }, { "epoch": 1.5201149425287355, "grad_norm": 6.113681316375732, "learning_rate": 1.086842105263158e-06, "loss": 0.5761, "step": 1587 }, { "epoch": 1.5201149425287355, "loss_full_dim": 0.29272589087486267, "loss_main": 0.5977290868759155, "loss_parscale": 0.59375, "loss_sub_dim": 0.30500316619873047, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.984375, "step": 1587 }, { "epoch": 1.5210727969348659, "grad_norm": 6.438180923461914, "learning_rate": 1.0842105263157895e-06, "loss": 0.5977, "step": 1588 }, { "epoch": 1.5210727969348659, "loss_full_dim": 0.28797340393066406, "loss_main": 0.5876954793930054, "loss_parscale": 0.58984375, "loss_sub_dim": 0.2997220456600189, "loss_vclub": 0.000946044921875, "parscale_sim": 0.984375, "step": 1588 }, { "epoch": 1.5220306513409962, "grad_norm": 6.340412139892578, "learning_rate": 1.0815789473684211e-06, "loss": 0.5877, "step": 1589 }, { "epoch": 1.5220306513409962, "loss_full_dim": 0.23166348040103912, "loss_main": 0.47335296869277954, "loss_parscale": 0.4765625, "loss_sub_dim": 0.24168947339057922, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.984375, "step": 1589 }, { "epoch": 1.5229885057471264, "grad_norm": 5.805327892303467, "learning_rate": 1.0789473684210527e-06, "loss": 0.4734, "step": 1590 }, { "epoch": 1.5229885057471264, "loss_full_dim": 0.2609327435493469, "loss_main": 0.5351004600524902, "loss_parscale": 0.53515625, "loss_sub_dim": 0.2741677165031433, "loss_vclub": 0.001007080078125, "parscale_sim": 0.984375, "step": 1590 }, { "epoch": 1.5239463601532566, "grad_norm": 8.8634614944458, "learning_rate": 1.0763157894736843e-06, "loss": 0.5351, "step": 1591 }, { "epoch": 1.5239463601532566, "loss_full_dim": 0.29366734623908997, "loss_main": 0.5994752645492554, "loss_parscale": 0.59765625, "loss_sub_dim": 0.305807888507843, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1591 }, { "epoch": 1.524904214559387, "grad_norm": 8.76005744934082, "learning_rate": 1.0736842105263159e-06, "loss": 0.5995, "step": 1592 }, { "epoch": 1.524904214559387, "loss_full_dim": 0.26979267597198486, "loss_main": 0.5509302616119385, "loss_parscale": 0.5546875, "loss_sub_dim": 0.281137615442276, "loss_vclub": 0.000972747802734375, "parscale_sim": 0.984375, "step": 1592 }, { "epoch": 1.5258620689655173, "grad_norm": 7.522891521453857, "learning_rate": 1.0710526315789475e-06, "loss": 0.5509, "step": 1593 }, { "epoch": 1.5258620689655173, "loss_full_dim": 0.3211836814880371, "loss_main": 0.6551686525344849, "loss_parscale": 0.65625, "loss_sub_dim": 0.33398497104644775, "loss_vclub": 0.000762939453125, "parscale_sim": 0.98828125, "step": 1593 }, { "epoch": 1.5268199233716475, "grad_norm": 9.30798625946045, "learning_rate": 1.068421052631579e-06, "loss": 0.6552, "step": 1594 }, { "epoch": 1.5268199233716475, "loss_full_dim": 0.31426653265953064, "loss_main": 0.6404658555984497, "loss_parscale": 0.640625, "loss_sub_dim": 0.32619932293891907, "loss_vclub": 0.00107574462890625, "parscale_sim": 0.98828125, "step": 1594 }, { "epoch": 1.5277777777777777, "grad_norm": 135.56375122070312, "learning_rate": 1.0657894736842106e-06, "loss": 0.6405, "step": 1595 }, { "epoch": 1.5277777777777777, "loss_full_dim": 0.2769826650619507, "loss_main": 0.5668060779571533, "loss_parscale": 0.578125, "loss_sub_dim": 0.28982341289520264, "loss_vclub": 0.001007080078125, "parscale_sim": 0.984375, "step": 1595 }, { "epoch": 1.528735632183908, "grad_norm": 6.873380661010742, "learning_rate": 1.0631578947368422e-06, "loss": 0.5668, "step": 1596 }, { "epoch": 1.528735632183908, "loss_full_dim": 0.2382703274488449, "loss_main": 0.4894460439682007, "loss_parscale": 0.49609375, "loss_sub_dim": 0.25117573142051697, "loss_vclub": 0.0006866455078125, "parscale_sim": 0.98046875, "step": 1596 }, { "epoch": 1.5296934865900385, "grad_norm": 6.693147659301758, "learning_rate": 1.0605263157894738e-06, "loss": 0.4894, "step": 1597 }, { "epoch": 1.5296934865900385, "loss_full_dim": 0.2954946458339691, "loss_main": 0.6028512716293335, "loss_parscale": 0.609375, "loss_sub_dim": 0.307356595993042, "loss_vclub": 0.00107574462890625, "parscale_sim": 0.98828125, "step": 1597 }, { "epoch": 1.5306513409961686, "grad_norm": 6.441985607147217, "learning_rate": 1.0578947368421054e-06, "loss": 0.6029, "step": 1598 }, { "epoch": 1.5306513409961686, "loss_full_dim": 0.30501699447631836, "loss_main": 0.6209715604782104, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3159545660018921, "loss_vclub": 0.0009765625, "parscale_sim": 0.98828125, "step": 1598 }, { "epoch": 1.5316091954022988, "grad_norm": 6.305158615112305, "learning_rate": 1.055263157894737e-06, "loss": 0.621, "step": 1599 }, { "epoch": 1.5316091954022988, "loss_full_dim": 0.2742574214935303, "loss_main": 0.5595269799232483, "loss_parscale": 0.5625, "loss_sub_dim": 0.285269558429718, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1599 }, { "epoch": 1.5325670498084292, "grad_norm": 7.515499591827393, "learning_rate": 1.0526315789473685e-06, "loss": 0.5595, "step": 1600 }, { "epoch": 1.5325670498084292, "loss_full_dim": 0.3273540735244751, "loss_main": 0.6689017415046692, "loss_parscale": 0.67578125, "loss_sub_dim": 0.3415476679801941, "loss_vclub": 0.0010986328125, "parscale_sim": 0.984375, "step": 1600 }, { "epoch": 1.5335249042145593, "grad_norm": 5.724565505981445, "learning_rate": 1.0500000000000001e-06, "loss": 0.6689, "step": 1601 }, { "epoch": 1.5335249042145593, "loss_full_dim": 0.24053023755550385, "loss_main": 0.49288225173950195, "loss_parscale": 0.498046875, "loss_sub_dim": 0.2523519992828369, "loss_vclub": 0.00107574462890625, "parscale_sim": 0.984375, "step": 1601 }, { "epoch": 1.5344827586206895, "grad_norm": 7.5518479347229, "learning_rate": 1.0473684210526317e-06, "loss": 0.4929, "step": 1602 }, { "epoch": 1.5344827586206895, "loss_full_dim": 0.2625426948070526, "loss_main": 0.5375175476074219, "loss_parscale": 0.54296875, "loss_sub_dim": 0.2749748229980469, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.984375, "step": 1602 }, { "epoch": 1.53544061302682, "grad_norm": 6.118851184844971, "learning_rate": 1.0447368421052633e-06, "loss": 0.5375, "step": 1603 }, { "epoch": 1.53544061302682, "loss_full_dim": 0.3220432996749878, "loss_main": 0.6596174240112305, "loss_parscale": 0.66015625, "loss_sub_dim": 0.3375740945339203, "loss_vclub": 0.000858306884765625, "parscale_sim": 0.97265625, "step": 1603 }, { "epoch": 1.5363984674329503, "grad_norm": 7.441565990447998, "learning_rate": 1.0421052631578949e-06, "loss": 0.6596, "step": 1604 }, { "epoch": 1.5363984674329503, "loss_full_dim": 0.26834213733673096, "loss_main": 0.546699583530426, "loss_parscale": 0.546875, "loss_sub_dim": 0.27835744619369507, "loss_vclub": 0.000904083251953125, "parscale_sim": 0.98046875, "step": 1604 }, { "epoch": 1.5373563218390804, "grad_norm": 13.06944465637207, "learning_rate": 1.0394736842105264e-06, "loss": 0.5467, "step": 1605 }, { "epoch": 1.5373563218390804, "loss_full_dim": 0.2817932665348053, "loss_main": 0.5740146636962891, "loss_parscale": 0.58203125, "loss_sub_dim": 0.2922213673591614, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.98046875, "step": 1605 }, { "epoch": 1.5383141762452106, "grad_norm": 7.185764312744141, "learning_rate": 1.036842105263158e-06, "loss": 0.574, "step": 1606 }, { "epoch": 1.5383141762452106, "loss_full_dim": 0.24811694025993347, "loss_main": 0.5075650215148926, "loss_parscale": 0.51953125, "loss_sub_dim": 0.2594481110572815, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.98046875, "step": 1606 }, { "epoch": 1.539272030651341, "grad_norm": 111.8059310913086, "learning_rate": 1.0342105263157896e-06, "loss": 0.5076, "step": 1607 }, { "epoch": 1.539272030651341, "loss_full_dim": 0.3306986093521118, "loss_main": 0.673525869846344, "loss_parscale": 0.671875, "loss_sub_dim": 0.3428272604942322, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.98828125, "step": 1607 }, { "epoch": 1.5402298850574714, "grad_norm": 10.222908973693848, "learning_rate": 1.0315789473684212e-06, "loss": 0.6735, "step": 1608 }, { "epoch": 1.5402298850574714, "loss_full_dim": 0.25123757123947144, "loss_main": 0.513714075088501, "loss_parscale": 0.515625, "loss_sub_dim": 0.26247650384902954, "loss_vclub": 0.0009002685546875, "parscale_sim": 0.98828125, "step": 1608 }, { "epoch": 1.5411877394636015, "grad_norm": 7.883967399597168, "learning_rate": 1.0289473684210528e-06, "loss": 0.5137, "step": 1609 }, { "epoch": 1.5411877394636015, "loss_full_dim": 0.34097132086753845, "loss_main": 0.6940422058105469, "loss_parscale": 0.6875, "loss_sub_dim": 0.35307085514068604, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.984375, "step": 1609 }, { "epoch": 1.5421455938697317, "grad_norm": 6.939558506011963, "learning_rate": 1.0263157894736843e-06, "loss": 0.694, "step": 1610 }, { "epoch": 1.5421455938697317, "loss_full_dim": 0.2606905400753021, "loss_main": 0.5321178436279297, "loss_parscale": 0.53125, "loss_sub_dim": 0.27142733335494995, "loss_vclub": 0.000858306884765625, "parscale_sim": 0.984375, "step": 1610 }, { "epoch": 1.543103448275862, "grad_norm": 8.36148738861084, "learning_rate": 1.023684210526316e-06, "loss": 0.5321, "step": 1611 }, { "epoch": 1.543103448275862, "loss_full_dim": 0.24559533596038818, "loss_main": 0.50211501121521, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2565196454524994, "loss_vclub": 0.0010986328125, "parscale_sim": 0.984375, "step": 1611 }, { "epoch": 1.5440613026819925, "grad_norm": 6.469964027404785, "learning_rate": 1.0210526315789475e-06, "loss": 0.5021, "step": 1612 }, { "epoch": 1.5440613026819925, "loss_full_dim": 0.26009804010391235, "loss_main": 0.5321180820465088, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27202001214027405, "loss_vclub": 0.000896453857421875, "parscale_sim": 0.98046875, "step": 1612 }, { "epoch": 1.5450191570881227, "grad_norm": 7.932923793792725, "learning_rate": 1.018421052631579e-06, "loss": 0.5321, "step": 1613 }, { "epoch": 1.5450191570881227, "loss_full_dim": 0.3260743021965027, "loss_main": 0.6648015379905701, "loss_parscale": 0.66796875, "loss_sub_dim": 0.3387272357940674, "loss_vclub": 0.000946044921875, "parscale_sim": 0.98046875, "step": 1613 }, { "epoch": 1.5459770114942528, "grad_norm": 4.898967266082764, "learning_rate": 1.0157894736842105e-06, "loss": 0.6648, "step": 1614 }, { "epoch": 1.5459770114942528, "loss_full_dim": 0.2520967721939087, "loss_main": 0.518585741519928, "loss_parscale": 0.5234375, "loss_sub_dim": 0.2664889693260193, "loss_vclub": 0.000949859619140625, "parscale_sim": 0.984375, "step": 1614 }, { "epoch": 1.5469348659003832, "grad_norm": 8.780598640441895, "learning_rate": 1.013157894736842e-06, "loss": 0.5186, "step": 1615 }, { "epoch": 1.5469348659003832, "loss_full_dim": 0.24600522220134735, "loss_main": 0.5043873190879822, "loss_parscale": 0.5078125, "loss_sub_dim": 0.25838208198547363, "loss_vclub": 0.000858306884765625, "parscale_sim": 0.984375, "step": 1615 }, { "epoch": 1.5478927203065134, "grad_norm": 6.168573379516602, "learning_rate": 1.0105263157894738e-06, "loss": 0.5044, "step": 1616 }, { "epoch": 1.5478927203065134, "loss_full_dim": 0.2723637819290161, "loss_main": 0.5572991371154785, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2849353849887848, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.9765625, "step": 1616 }, { "epoch": 1.5488505747126435, "grad_norm": 6.938534736633301, "learning_rate": 1.0078947368421054e-06, "loss": 0.5573, "step": 1617 }, { "epoch": 1.5488505747126435, "loss_full_dim": 0.2813868224620819, "loss_main": 0.5744286775588989, "loss_parscale": 0.578125, "loss_sub_dim": 0.29304182529449463, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1617 }, { "epoch": 1.549808429118774, "grad_norm": 8.3148775100708, "learning_rate": 1.005263157894737e-06, "loss": 0.5744, "step": 1618 }, { "epoch": 1.549808429118774, "loss_full_dim": 0.3258458077907562, "loss_main": 0.6638633012771606, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33801746368408203, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.98046875, "step": 1618 }, { "epoch": 1.5507662835249043, "grad_norm": 8.565882682800293, "learning_rate": 1.0026315789473686e-06, "loss": 0.6639, "step": 1619 }, { "epoch": 1.5507662835249043, "loss_full_dim": 0.21853843331336975, "loss_main": 0.44883283972740173, "loss_parscale": 0.4453125, "loss_sub_dim": 0.23029440641403198, "loss_vclub": 0.000823974609375, "parscale_sim": 0.98046875, "step": 1619 }, { "epoch": 1.5517241379310345, "grad_norm": 6.045705795288086, "learning_rate": 1.0000000000000002e-06, "loss": 0.4488, "step": 1620 }, { "epoch": 1.5517241379310345, "loss_full_dim": 0.2776128053665161, "loss_main": 0.5700501203536987, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2924373149871826, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1620 }, { "epoch": 1.5526819923371646, "grad_norm": 7.732439994812012, "learning_rate": 9.973684210526315e-07, "loss": 0.5701, "step": 1621 }, { "epoch": 1.5526819923371646, "loss_full_dim": 0.2562163174152374, "loss_main": 0.5238050222396851, "loss_parscale": 0.515625, "loss_sub_dim": 0.26758867502212524, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.98828125, "step": 1621 }, { "epoch": 1.553639846743295, "grad_norm": 5.2401275634765625, "learning_rate": 9.947368421052631e-07, "loss": 0.5238, "step": 1622 }, { "epoch": 1.553639846743295, "loss_full_dim": 0.257670521736145, "loss_main": 0.5258908867835999, "loss_parscale": 0.53125, "loss_sub_dim": 0.26822036504745483, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.984375, "step": 1622 }, { "epoch": 1.5545977011494254, "grad_norm": 9.097284317016602, "learning_rate": 9.921052631578947e-07, "loss": 0.5259, "step": 1623 }, { "epoch": 1.5545977011494254, "loss_full_dim": 0.36149147152900696, "loss_main": 0.7351914644241333, "loss_parscale": 0.7265625, "loss_sub_dim": 0.37370002269744873, "loss_vclub": 0.000713348388671875, "parscale_sim": 0.98046875, "step": 1623 }, { "epoch": 1.5555555555555556, "grad_norm": 7.721503734588623, "learning_rate": 9.894736842105265e-07, "loss": 0.7352, "step": 1624 }, { "epoch": 1.5555555555555556, "loss_full_dim": 0.3239631652832031, "loss_main": 0.6600184440612793, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33605527877807617, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.984375, "step": 1624 }, { "epoch": 1.5565134099616857, "grad_norm": 10.50611400604248, "learning_rate": 9.86842105263158e-07, "loss": 0.66, "step": 1625 }, { "epoch": 1.5565134099616857, "loss_full_dim": 0.2067486047744751, "loss_main": 0.42225390672683716, "loss_parscale": 0.42578125, "loss_sub_dim": 0.21550528705120087, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1625 }, { "epoch": 1.5574712643678161, "grad_norm": 7.029263973236084, "learning_rate": 9.842105263157897e-07, "loss": 0.4223, "step": 1626 }, { "epoch": 1.5574712643678161, "loss_full_dim": 0.28951436281204224, "loss_main": 0.5931764841079712, "loss_parscale": 0.58984375, "loss_sub_dim": 0.30366212129592896, "loss_vclub": 0.001068115234375, "parscale_sim": 0.984375, "step": 1626 }, { "epoch": 1.5584291187739465, "grad_norm": 7.117696285247803, "learning_rate": 9.815789473684212e-07, "loss": 0.5932, "step": 1627 }, { "epoch": 1.5584291187739465, "loss_full_dim": 0.32554182410240173, "loss_main": 0.662028431892395, "loss_parscale": 0.671875, "loss_sub_dim": 0.3364866375923157, "loss_vclub": 0.00103759765625, "parscale_sim": 0.984375, "step": 1627 }, { "epoch": 1.5593869731800765, "grad_norm": 9.555520057678223, "learning_rate": 9.789473684210526e-07, "loss": 0.662, "step": 1628 }, { "epoch": 1.5593869731800765, "loss_full_dim": 0.3124113082885742, "loss_main": 0.6376394033432007, "loss_parscale": 0.63671875, "loss_sub_dim": 0.3252280652523041, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.984375, "step": 1628 }, { "epoch": 1.5603448275862069, "grad_norm": 6.173624038696289, "learning_rate": 9.763157894736842e-07, "loss": 0.6376, "step": 1629 }, { "epoch": 1.5603448275862069, "loss_full_dim": 0.2585851550102234, "loss_main": 0.5292741656303406, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2706890106201172, "loss_vclub": 0.0008544921875, "parscale_sim": 0.984375, "step": 1629 }, { "epoch": 1.5613026819923372, "grad_norm": 7.758520603179932, "learning_rate": 9.736842105263158e-07, "loss": 0.5293, "step": 1630 }, { "epoch": 1.5613026819923372, "loss_full_dim": 0.3046638071537018, "loss_main": 0.6203938722610474, "loss_parscale": 0.625, "loss_sub_dim": 0.3157300651073456, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.9765625, "step": 1630 }, { "epoch": 1.5622605363984674, "grad_norm": 7.782328128814697, "learning_rate": 9.710526315789474e-07, "loss": 0.6204, "step": 1631 }, { "epoch": 1.5622605363984674, "loss_full_dim": 0.35997533798217773, "loss_main": 0.7340778112411499, "loss_parscale": 0.734375, "loss_sub_dim": 0.3741024434566498, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.984375, "step": 1631 }, { "epoch": 1.5632183908045976, "grad_norm": 7.7603278160095215, "learning_rate": 9.68421052631579e-07, "loss": 0.7341, "step": 1632 }, { "epoch": 1.5632183908045976, "loss_full_dim": 0.33206915855407715, "loss_main": 0.6780242919921875, "loss_parscale": 0.6796875, "loss_sub_dim": 0.34595513343811035, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.98828125, "step": 1632 }, { "epoch": 1.564176245210728, "grad_norm": 7.42842960357666, "learning_rate": 9.657894736842107e-07, "loss": 0.678, "step": 1633 }, { "epoch": 1.564176245210728, "loss_full_dim": 0.2867759168148041, "loss_main": 0.5853608846664429, "loss_parscale": 0.59375, "loss_sub_dim": 0.2985849380493164, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.984375, "step": 1633 }, { "epoch": 1.5651340996168583, "grad_norm": 8.724678993225098, "learning_rate": 9.631578947368423e-07, "loss": 0.5854, "step": 1634 }, { "epoch": 1.5651340996168583, "loss_full_dim": 0.2555168569087982, "loss_main": 0.5217725038528442, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26625561714172363, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.98046875, "step": 1634 }, { "epoch": 1.5660919540229885, "grad_norm": 6.615720748901367, "learning_rate": 9.605263157894737e-07, "loss": 0.5218, "step": 1635 }, { "epoch": 1.5660919540229885, "loss_full_dim": 0.26602640748023987, "loss_main": 0.5414224863052368, "loss_parscale": 0.546875, "loss_sub_dim": 0.27539610862731934, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.98828125, "step": 1635 }, { "epoch": 1.5670498084291187, "grad_norm": 7.2694926261901855, "learning_rate": 9.578947368421053e-07, "loss": 0.5414, "step": 1636 }, { "epoch": 1.5670498084291187, "loss_full_dim": 0.23466326296329498, "loss_main": 0.4828298091888428, "loss_parscale": 0.4921875, "loss_sub_dim": 0.2481665313243866, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.984375, "step": 1636 }, { "epoch": 1.568007662835249, "grad_norm": 7.888628959655762, "learning_rate": 9.552631578947368e-07, "loss": 0.4828, "step": 1637 }, { "epoch": 1.568007662835249, "loss_full_dim": 0.26761990785598755, "loss_main": 0.5498929023742676, "loss_parscale": 0.55859375, "loss_sub_dim": 0.28227299451828003, "loss_vclub": 0.00115966796875, "parscale_sim": 0.984375, "step": 1637 }, { "epoch": 1.5689655172413794, "grad_norm": 6.451563835144043, "learning_rate": 9.526315789473685e-07, "loss": 0.5499, "step": 1638 }, { "epoch": 1.5689655172413794, "loss_full_dim": 0.31557002663612366, "loss_main": 0.6461528539657593, "loss_parscale": 0.6484375, "loss_sub_dim": 0.330582857131958, "loss_vclub": 0.0009765625, "parscale_sim": 0.984375, "step": 1638 }, { "epoch": 1.5699233716475096, "grad_norm": 6.828489780426025, "learning_rate": 9.500000000000001e-07, "loss": 0.6462, "step": 1639 }, { "epoch": 1.5699233716475096, "loss_full_dim": 0.31364622712135315, "loss_main": 0.6419447660446167, "loss_parscale": 0.6484375, "loss_sub_dim": 0.32829850912094116, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98046875, "step": 1639 }, { "epoch": 1.5708812260536398, "grad_norm": 10.641986846923828, "learning_rate": 9.473684210526317e-07, "loss": 0.6419, "step": 1640 }, { "epoch": 1.5708812260536398, "loss_full_dim": 0.3001241683959961, "loss_main": 0.6140937209129333, "loss_parscale": 0.6171875, "loss_sub_dim": 0.31396955251693726, "loss_vclub": 0.00080108642578125, "parscale_sim": 0.98046875, "step": 1640 }, { "epoch": 1.5718390804597702, "grad_norm": 8.16611385345459, "learning_rate": 9.447368421052633e-07, "loss": 0.6141, "step": 1641 }, { "epoch": 1.5718390804597702, "loss_full_dim": 0.28698745369911194, "loss_main": 0.5856584310531616, "loss_parscale": 0.5859375, "loss_sub_dim": 0.2986709773540497, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.98828125, "step": 1641 }, { "epoch": 1.5727969348659003, "grad_norm": 7.865530490875244, "learning_rate": 9.421052631578948e-07, "loss": 0.5857, "step": 1642 }, { "epoch": 1.5727969348659003, "loss_full_dim": 0.28530165553092957, "loss_main": 0.5845876932144165, "loss_parscale": 0.59375, "loss_sub_dim": 0.2992860674858093, "loss_vclub": 0.001068115234375, "parscale_sim": 0.984375, "step": 1642 }, { "epoch": 1.5737547892720305, "grad_norm": 6.7336578369140625, "learning_rate": 9.394736842105263e-07, "loss": 0.5846, "step": 1643 }, { "epoch": 1.5737547892720305, "loss_full_dim": 0.27066367864608765, "loss_main": 0.5554198622703552, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2847561836242676, "loss_vclub": 0.000873565673828125, "parscale_sim": 0.9765625, "step": 1643 }, { "epoch": 1.5747126436781609, "grad_norm": 8.910909652709961, "learning_rate": 9.368421052631579e-07, "loss": 0.5554, "step": 1644 }, { "epoch": 1.5747126436781609, "loss_full_dim": 0.23036514222621918, "loss_main": 0.4710674285888672, "loss_parscale": 0.4765625, "loss_sub_dim": 0.2407023012638092, "loss_vclub": 0.0010986328125, "parscale_sim": 0.98828125, "step": 1644 }, { "epoch": 1.5756704980842913, "grad_norm": 6.796816825866699, "learning_rate": 9.342105263157895e-07, "loss": 0.4711, "step": 1645 }, { "epoch": 1.5756704980842913, "loss_full_dim": 0.3055919110774994, "loss_main": 0.6222530603408813, "loss_parscale": 0.6328125, "loss_sub_dim": 0.31666111946105957, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.984375, "step": 1645 }, { "epoch": 1.5766283524904214, "grad_norm": 7.983028411865234, "learning_rate": 9.315789473684212e-07, "loss": 0.6223, "step": 1646 }, { "epoch": 1.5766283524904214, "loss_full_dim": 0.29298004508018494, "loss_main": 0.5983514785766602, "loss_parscale": 0.609375, "loss_sub_dim": 0.3053714334964752, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.98046875, "step": 1646 }, { "epoch": 1.5775862068965516, "grad_norm": 7.424783706665039, "learning_rate": 9.289473684210528e-07, "loss": 0.5984, "step": 1647 }, { "epoch": 1.5775862068965516, "loss_full_dim": 0.26366063952445984, "loss_main": 0.5368351936340332, "loss_parscale": 0.53125, "loss_sub_dim": 0.27317458391189575, "loss_vclub": 0.00106048583984375, "parscale_sim": 0.98046875, "step": 1647 }, { "epoch": 1.578544061302682, "grad_norm": 7.281362056732178, "learning_rate": 9.263157894736844e-07, "loss": 0.5368, "step": 1648 }, { "epoch": 1.578544061302682, "loss_full_dim": 0.23681741952896118, "loss_main": 0.48405641317367554, "loss_parscale": 0.48828125, "loss_sub_dim": 0.24723899364471436, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.98828125, "step": 1648 }, { "epoch": 1.5795019157088124, "grad_norm": 4.90934944152832, "learning_rate": 9.236842105263159e-07, "loss": 0.4841, "step": 1649 }, { "epoch": 1.5795019157088124, "loss_full_dim": 0.28626516461372375, "loss_main": 0.5852707624435425, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29900556802749634, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.98828125, "step": 1649 }, { "epoch": 1.5804597701149425, "grad_norm": 9.358651161193848, "learning_rate": 9.210526315789474e-07, "loss": 0.5853, "step": 1650 }, { "epoch": 1.5804597701149425, "loss_full_dim": 0.2526848316192627, "loss_main": 0.517320990562439, "loss_parscale": 0.515625, "loss_sub_dim": 0.2646361291408539, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1650 }, { "epoch": 1.5814176245210727, "grad_norm": 8.646125793457031, "learning_rate": 9.18421052631579e-07, "loss": 0.5173, "step": 1651 }, { "epoch": 1.5814176245210727, "loss_full_dim": 0.323872834444046, "loss_main": 0.658293604850769, "loss_parscale": 0.6640625, "loss_sub_dim": 0.33442074060440063, "loss_vclub": 0.00104522705078125, "parscale_sim": 0.984375, "step": 1651 }, { "epoch": 1.582375478927203, "grad_norm": 7.515748500823975, "learning_rate": 9.157894736842106e-07, "loss": 0.6583, "step": 1652 }, { "epoch": 1.582375478927203, "loss_full_dim": 0.2195880264043808, "loss_main": 0.4496021270751953, "loss_parscale": 0.4453125, "loss_sub_dim": 0.2300141155719757, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.984375, "step": 1652 }, { "epoch": 1.5833333333333335, "grad_norm": 5.287741184234619, "learning_rate": 9.131578947368422e-07, "loss": 0.4496, "step": 1653 }, { "epoch": 1.5833333333333335, "loss_full_dim": 0.20197471976280212, "loss_main": 0.4144861400127411, "loss_parscale": 0.421875, "loss_sub_dim": 0.21251142024993896, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.984375, "step": 1653 }, { "epoch": 1.5842911877394636, "grad_norm": 6.198366165161133, "learning_rate": 9.105263157894737e-07, "loss": 0.4145, "step": 1654 }, { "epoch": 1.5842911877394636, "loss_full_dim": 0.3079392611980438, "loss_main": 0.6297237873077393, "loss_parscale": 0.6328125, "loss_sub_dim": 0.3217845559120178, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.984375, "step": 1654 }, { "epoch": 1.5852490421455938, "grad_norm": 7.414093971252441, "learning_rate": 9.078947368421054e-07, "loss": 0.6297, "step": 1655 }, { "epoch": 1.5852490421455938, "loss_full_dim": 0.2880968451499939, "loss_main": 0.5868696570396423, "loss_parscale": 0.59375, "loss_sub_dim": 0.29877281188964844, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.984375, "step": 1655 }, { "epoch": 1.5862068965517242, "grad_norm": 6.340543270111084, "learning_rate": 9.05263157894737e-07, "loss": 0.5869, "step": 1656 }, { "epoch": 1.5862068965517242, "loss_full_dim": 0.24505680799484253, "loss_main": 0.5017655491828918, "loss_parscale": 0.51171875, "loss_sub_dim": 0.2567087411880493, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.98828125, "step": 1656 }, { "epoch": 1.5871647509578544, "grad_norm": 6.151679515838623, "learning_rate": 9.026315789473685e-07, "loss": 0.5018, "step": 1657 }, { "epoch": 1.5871647509578544, "loss_full_dim": 0.3019888997077942, "loss_main": 0.6169933080673218, "loss_parscale": 0.61328125, "loss_sub_dim": 0.3150043785572052, "loss_vclub": 0.0007476806640625, "parscale_sim": 0.984375, "step": 1657 }, { "epoch": 1.5881226053639845, "grad_norm": 11.755770683288574, "learning_rate": 9.000000000000001e-07, "loss": 0.617, "step": 1658 }, { "epoch": 1.5881226053639845, "loss_full_dim": 0.2634030282497406, "loss_main": 0.5372769832611084, "loss_parscale": 0.54296875, "loss_sub_dim": 0.2738739848136902, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.984375, "step": 1658 }, { "epoch": 1.589080459770115, "grad_norm": 9.702309608459473, "learning_rate": 8.973684210526316e-07, "loss": 0.5373, "step": 1659 }, { "epoch": 1.589080459770115, "loss_full_dim": 0.29874590039253235, "loss_main": 0.6109675168991089, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3122216463088989, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.984375, "step": 1659 }, { "epoch": 1.5900383141762453, "grad_norm": 7.908725261688232, "learning_rate": 8.947368421052632e-07, "loss": 0.611, "step": 1660 }, { "epoch": 1.5900383141762453, "loss_full_dim": 0.2567756772041321, "loss_main": 0.5236423015594482, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26686662435531616, "loss_vclub": 0.0010528564453125, "parscale_sim": 0.98828125, "step": 1660 }, { "epoch": 1.5909961685823755, "grad_norm": 5.750856876373291, "learning_rate": 8.921052631578948e-07, "loss": 0.5236, "step": 1661 }, { "epoch": 1.5909961685823755, "loss_full_dim": 0.2759225368499756, "loss_main": 0.5629702806472778, "loss_parscale": 0.5625, "loss_sub_dim": 0.28704774379730225, "loss_vclub": 0.0009765625, "parscale_sim": 0.984375, "step": 1661 }, { "epoch": 1.5919540229885056, "grad_norm": 5.0707478523254395, "learning_rate": 8.894736842105264e-07, "loss": 0.563, "step": 1662 }, { "epoch": 1.5919540229885056, "loss_full_dim": 0.23117230832576752, "loss_main": 0.4754624366760254, "loss_parscale": 0.482421875, "loss_sub_dim": 0.24429014325141907, "loss_vclub": 0.000797271728515625, "parscale_sim": 0.984375, "step": 1662 }, { "epoch": 1.592911877394636, "grad_norm": 7.15294075012207, "learning_rate": 8.868421052631581e-07, "loss": 0.4755, "step": 1663 }, { "epoch": 1.592911877394636, "loss_full_dim": 0.2872697710990906, "loss_main": 0.5841541290283203, "loss_parscale": 0.59375, "loss_sub_dim": 0.29688435792922974, "loss_vclub": 0.00104522705078125, "parscale_sim": 0.98046875, "step": 1663 }, { "epoch": 1.5938697318007664, "grad_norm": 8.544384002685547, "learning_rate": 8.842105263157895e-07, "loss": 0.5842, "step": 1664 }, { "epoch": 1.5938697318007664, "loss_full_dim": 0.2581670880317688, "loss_main": 0.529678225517273, "loss_parscale": 0.53125, "loss_sub_dim": 0.27151116728782654, "loss_vclub": 0.000732421875, "parscale_sim": 0.984375, "step": 1664 }, { "epoch": 1.5948275862068966, "grad_norm": 6.22068452835083, "learning_rate": 8.815789473684211e-07, "loss": 0.5297, "step": 1665 }, { "epoch": 1.5948275862068966, "loss_full_dim": 0.3197077214717865, "loss_main": 0.6502970457077026, "loss_parscale": 0.6484375, "loss_sub_dim": 0.33058929443359375, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.984375, "step": 1665 }, { "epoch": 1.5957854406130267, "grad_norm": 9.596500396728516, "learning_rate": 8.789473684210527e-07, "loss": 0.6503, "step": 1666 }, { "epoch": 1.5957854406130267, "loss_full_dim": 0.24436461925506592, "loss_main": 0.4991057515144348, "loss_parscale": 0.5, "loss_sub_dim": 0.2547411322593689, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.98046875, "step": 1666 }, { "epoch": 1.5967432950191571, "grad_norm": 6.224969863891602, "learning_rate": 8.763157894736843e-07, "loss": 0.4991, "step": 1667 }, { "epoch": 1.5967432950191571, "loss_full_dim": 0.23725011944770813, "loss_main": 0.48654860258102417, "loss_parscale": 0.48828125, "loss_sub_dim": 0.24929848313331604, "loss_vclub": 0.000896453857421875, "parscale_sim": 0.984375, "step": 1667 }, { "epoch": 1.5977011494252875, "grad_norm": 7.16140604019165, "learning_rate": 8.736842105263159e-07, "loss": 0.4865, "step": 1668 }, { "epoch": 1.5977011494252875, "loss_full_dim": 0.27974578738212585, "loss_main": 0.5697741508483887, "loss_parscale": 0.578125, "loss_sub_dim": 0.2900283932685852, "loss_vclub": 0.000885009765625, "parscale_sim": 0.98828125, "step": 1668 }, { "epoch": 1.5986590038314177, "grad_norm": 5.257695198059082, "learning_rate": 8.710526315789475e-07, "loss": 0.5698, "step": 1669 }, { "epoch": 1.5986590038314177, "loss_full_dim": 0.2659642696380615, "loss_main": 0.5435097217559814, "loss_parscale": 0.54296875, "loss_sub_dim": 0.2775454521179199, "loss_vclub": 0.000946044921875, "parscale_sim": 0.98828125, "step": 1669 }, { "epoch": 1.5996168582375478, "grad_norm": 7.650420188903809, "learning_rate": 8.68421052631579e-07, "loss": 0.5435, "step": 1670 }, { "epoch": 1.5996168582375478, "loss_full_dim": 0.23310860991477966, "loss_main": 0.47815755009651184, "loss_parscale": 0.48046875, "loss_sub_dim": 0.24504894018173218, "loss_vclub": 0.000946044921875, "parscale_sim": 0.98828125, "step": 1670 }, { "epoch": 1.6005747126436782, "grad_norm": 5.594642162322998, "learning_rate": 8.657894736842105e-07, "loss": 0.4782, "step": 1671 }, { "epoch": 1.6005747126436782, "loss_full_dim": 0.32519304752349854, "loss_main": 0.6639251112937927, "loss_parscale": 0.66796875, "loss_sub_dim": 0.3387320637702942, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.98046875, "step": 1671 }, { "epoch": 1.6015325670498084, "grad_norm": 8.198210716247559, "learning_rate": 8.631578947368421e-07, "loss": 0.6639, "step": 1672 }, { "epoch": 1.6015325670498084, "loss_full_dim": 0.24852487444877625, "loss_main": 0.5070033073425293, "loss_parscale": 0.5078125, "loss_sub_dim": 0.25847840309143066, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.98046875, "step": 1672 }, { "epoch": 1.6024904214559386, "grad_norm": 5.805592060089111, "learning_rate": 8.605263157894737e-07, "loss": 0.507, "step": 1673 }, { "epoch": 1.6024904214559386, "loss_full_dim": 0.2380826473236084, "loss_main": 0.48796531558036804, "loss_parscale": 0.4921875, "loss_sub_dim": 0.24988266825675964, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.98046875, "step": 1673 }, { "epoch": 1.603448275862069, "grad_norm": 6.575294494628906, "learning_rate": 8.578947368421054e-07, "loss": 0.488, "step": 1674 }, { "epoch": 1.603448275862069, "loss_full_dim": 0.26912155747413635, "loss_main": 0.5495554208755493, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2804338335990906, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.984375, "step": 1674 }, { "epoch": 1.6044061302681993, "grad_norm": 8.43377685546875, "learning_rate": 8.55263157894737e-07, "loss": 0.5496, "step": 1675 }, { "epoch": 1.6044061302681993, "loss_full_dim": 0.22108635306358337, "loss_main": 0.4530077576637268, "loss_parscale": 0.462890625, "loss_sub_dim": 0.23192140460014343, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.984375, "step": 1675 }, { "epoch": 1.6053639846743295, "grad_norm": 5.313878059387207, "learning_rate": 8.526315789473685e-07, "loss": 0.453, "step": 1676 }, { "epoch": 1.6053639846743295, "loss_full_dim": 0.30016574263572693, "loss_main": 0.6126976013183594, "loss_parscale": 0.625, "loss_sub_dim": 0.31253182888031006, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.9765625, "step": 1676 }, { "epoch": 1.6063218390804597, "grad_norm": 9.43499755859375, "learning_rate": 8.500000000000001e-07, "loss": 0.6127, "step": 1677 }, { "epoch": 1.6063218390804597, "loss_full_dim": 0.282795786857605, "loss_main": 0.5772824287414551, "loss_parscale": 0.5859375, "loss_sub_dim": 0.2944866418838501, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.984375, "step": 1677 }, { "epoch": 1.60727969348659, "grad_norm": 5.65078592300415, "learning_rate": 8.473684210526316e-07, "loss": 0.5773, "step": 1678 }, { "epoch": 1.60727969348659, "loss_full_dim": 0.30360186100006104, "loss_main": 0.6194963455200195, "loss_parscale": 0.62890625, "loss_sub_dim": 0.3158944845199585, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.984375, "step": 1678 }, { "epoch": 1.6082375478927204, "grad_norm": 4.949225902557373, "learning_rate": 8.447368421052632e-07, "loss": 0.6195, "step": 1679 }, { "epoch": 1.6082375478927204, "loss_full_dim": 0.24836350977420807, "loss_main": 0.5085485577583313, "loss_parscale": 0.51171875, "loss_sub_dim": 0.26018503308296204, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.97265625, "step": 1679 }, { "epoch": 1.6091954022988506, "grad_norm": 6.8458251953125, "learning_rate": 8.421052631578948e-07, "loss": 0.5085, "step": 1680 }, { "epoch": 1.6091954022988506, "loss_full_dim": 0.3142143189907074, "loss_main": 0.6410316228866577, "loss_parscale": 0.640625, "loss_sub_dim": 0.32681727409362793, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.98828125, "step": 1680 }, { "epoch": 1.6101532567049808, "grad_norm": 8.975677490234375, "learning_rate": 8.394736842105263e-07, "loss": 0.641, "step": 1681 }, { "epoch": 1.6101532567049808, "loss_full_dim": 0.28851306438446045, "loss_main": 0.5893349647521973, "loss_parscale": 0.59375, "loss_sub_dim": 0.3008219003677368, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.984375, "step": 1681 }, { "epoch": 1.6111111111111112, "grad_norm": 6.992921829223633, "learning_rate": 8.36842105263158e-07, "loss": 0.5893, "step": 1682 }, { "epoch": 1.6111111111111112, "loss_full_dim": 0.24959154427051544, "loss_main": 0.5104091167449951, "loss_parscale": 0.51171875, "loss_sub_dim": 0.26081758737564087, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98046875, "step": 1682 }, { "epoch": 1.6120689655172413, "grad_norm": 8.329347610473633, "learning_rate": 8.342105263157896e-07, "loss": 0.5104, "step": 1683 }, { "epoch": 1.6120689655172413, "loss_full_dim": 0.2297409623861313, "loss_main": 0.47120657563209534, "loss_parscale": 0.47265625, "loss_sub_dim": 0.24146561324596405, "loss_vclub": 0.000888824462890625, "parscale_sim": 0.984375, "step": 1683 }, { "epoch": 1.6130268199233715, "grad_norm": 6.2106781005859375, "learning_rate": 8.315789473684212e-07, "loss": 0.4712, "step": 1684 }, { "epoch": 1.6130268199233715, "loss_full_dim": 0.2751995325088501, "loss_main": 0.5615295171737671, "loss_parscale": 0.5625, "loss_sub_dim": 0.2863299548625946, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.9765625, "step": 1684 }, { "epoch": 1.6139846743295019, "grad_norm": 5.6482768058776855, "learning_rate": 8.289473684210527e-07, "loss": 0.5615, "step": 1685 }, { "epoch": 1.6139846743295019, "loss_full_dim": 0.24443966150283813, "loss_main": 0.5016185641288757, "loss_parscale": 0.5, "loss_sub_dim": 0.2571789026260376, "loss_vclub": 0.001129150390625, "parscale_sim": 0.98046875, "step": 1685 }, { "epoch": 1.6149425287356323, "grad_norm": 6.427104473114014, "learning_rate": 8.263157894736843e-07, "loss": 0.5016, "step": 1686 }, { "epoch": 1.6149425287356323, "loss_full_dim": 0.2525297999382019, "loss_main": 0.5154921412467957, "loss_parscale": 0.51953125, "loss_sub_dim": 0.26296234130859375, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.984375, "step": 1686 }, { "epoch": 1.6159003831417624, "grad_norm": 5.530725479125977, "learning_rate": 8.236842105263158e-07, "loss": 0.5155, "step": 1687 }, { "epoch": 1.6159003831417624, "loss_full_dim": 0.26729273796081543, "loss_main": 0.5472180843353271, "loss_parscale": 0.546875, "loss_sub_dim": 0.2799253463745117, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98046875, "step": 1687 }, { "epoch": 1.6168582375478926, "grad_norm": 6.6412200927734375, "learning_rate": 8.210526315789474e-07, "loss": 0.5472, "step": 1688 }, { "epoch": 1.6168582375478926, "loss_full_dim": 0.2496042102575302, "loss_main": 0.5114153623580933, "loss_parscale": 0.515625, "loss_sub_dim": 0.26181113719940186, "loss_vclub": 0.00107574462890625, "parscale_sim": 0.984375, "step": 1688 }, { "epoch": 1.617816091954023, "grad_norm": 6.987290859222412, "learning_rate": 8.18421052631579e-07, "loss": 0.5114, "step": 1689 }, { "epoch": 1.617816091954023, "loss_full_dim": 0.2356293797492981, "loss_main": 0.4814455509185791, "loss_parscale": 0.484375, "loss_sub_dim": 0.245816171169281, "loss_vclub": 0.000919342041015625, "parscale_sim": 0.9765625, "step": 1689 }, { "epoch": 1.6187739463601534, "grad_norm": 10.004325866699219, "learning_rate": 8.157894736842106e-07, "loss": 0.4814, "step": 1690 }, { "epoch": 1.6187739463601534, "loss_full_dim": 0.24421198666095734, "loss_main": 0.49841171503067017, "loss_parscale": 0.498046875, "loss_sub_dim": 0.254199743270874, "loss_vclub": 0.0009002685546875, "parscale_sim": 0.984375, "step": 1690 }, { "epoch": 1.6197318007662835, "grad_norm": 5.588013172149658, "learning_rate": 8.131578947368423e-07, "loss": 0.4984, "step": 1691 }, { "epoch": 1.6197318007662835, "loss_full_dim": 0.29768332839012146, "loss_main": 0.6059521436691284, "loss_parscale": 0.609375, "loss_sub_dim": 0.30826884508132935, "loss_vclub": 0.000835418701171875, "parscale_sim": 0.984375, "step": 1691 }, { "epoch": 1.6206896551724137, "grad_norm": 4.319547653198242, "learning_rate": 8.105263157894736e-07, "loss": 0.606, "step": 1692 }, { "epoch": 1.6206896551724137, "loss_full_dim": 0.3176726996898651, "loss_main": 0.648388147354126, "loss_parscale": 0.65234375, "loss_sub_dim": 0.33071544766426086, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.98828125, "step": 1692 }, { "epoch": 1.621647509578544, "grad_norm": 8.634143829345703, "learning_rate": 8.078947368421053e-07, "loss": 0.6484, "step": 1693 }, { "epoch": 1.621647509578544, "loss_full_dim": 0.28862521052360535, "loss_main": 0.5886320471763611, "loss_parscale": 0.59375, "loss_sub_dim": 0.30000683665275574, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.984375, "step": 1693 }, { "epoch": 1.6226053639846745, "grad_norm": 7.168097496032715, "learning_rate": 8.052631578947369e-07, "loss": 0.5886, "step": 1694 }, { "epoch": 1.6226053639846745, "loss_full_dim": 0.28069576621055603, "loss_main": 0.574618399143219, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29392263293266296, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.984375, "step": 1694 }, { "epoch": 1.6235632183908046, "grad_norm": 8.088167190551758, "learning_rate": 8.026315789473685e-07, "loss": 0.5746, "step": 1695 }, { "epoch": 1.6235632183908046, "loss_full_dim": 0.23867768049240112, "loss_main": 0.48748230934143066, "loss_parscale": 0.4921875, "loss_sub_dim": 0.24880462884902954, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.984375, "step": 1695 }, { "epoch": 1.6245210727969348, "grad_norm": 4.805434703826904, "learning_rate": 8.000000000000001e-07, "loss": 0.4875, "step": 1696 }, { "epoch": 1.6245210727969348, "loss_full_dim": 0.2575283944606781, "loss_main": 0.5258711576461792, "loss_parscale": 0.5234375, "loss_sub_dim": 0.2683427929878235, "loss_vclub": 0.0011444091796875, "parscale_sim": 0.984375, "step": 1696 }, { "epoch": 1.6254789272030652, "grad_norm": 6.6694111824035645, "learning_rate": 7.973684210526317e-07, "loss": 0.5259, "step": 1697 }, { "epoch": 1.6254789272030652, "loss_full_dim": 0.2637932598590851, "loss_main": 0.5382480025291443, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2744547426700592, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1697 }, { "epoch": 1.6264367816091954, "grad_norm": 5.1627373695373535, "learning_rate": 7.947368421052632e-07, "loss": 0.5382, "step": 1698 }, { "epoch": 1.6264367816091954, "loss_full_dim": 0.2867725193500519, "loss_main": 0.5851378440856934, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29836535453796387, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.984375, "step": 1698 }, { "epoch": 1.6273946360153255, "grad_norm": 7.617204189300537, "learning_rate": 7.921052631578947e-07, "loss": 0.5851, "step": 1699 }, { "epoch": 1.6273946360153255, "loss_full_dim": 0.24384376406669617, "loss_main": 0.5002022981643677, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2563585042953491, "loss_vclub": 0.00110626220703125, "parscale_sim": 0.984375, "step": 1699 }, { "epoch": 1.628352490421456, "grad_norm": 8.731095314025879, "learning_rate": 7.894736842105263e-07, "loss": 0.5002, "step": 1700 }, { "epoch": 1.628352490421456, "loss_full_dim": 0.26765191555023193, "loss_main": 0.5491011142730713, "loss_parscale": 0.5546875, "loss_sub_dim": 0.28144919872283936, "loss_vclub": 0.000720977783203125, "parscale_sim": 0.98046875, "step": 1700 }, { "epoch": 1.6293103448275863, "grad_norm": 6.929474830627441, "learning_rate": 7.86842105263158e-07, "loss": 0.5491, "step": 1701 }, { "epoch": 1.6293103448275863, "loss_full_dim": 0.2286425530910492, "loss_main": 0.4667759835720062, "loss_parscale": 0.474609375, "loss_sub_dim": 0.23813343048095703, "loss_vclub": 0.001007080078125, "parscale_sim": 0.98046875, "step": 1701 }, { "epoch": 1.6302681992337165, "grad_norm": 5.306651592254639, "learning_rate": 7.842105263157896e-07, "loss": 0.4668, "step": 1702 }, { "epoch": 1.6302681992337165, "loss_full_dim": 0.2112416923046112, "loss_main": 0.43289968371391296, "loss_parscale": 0.443359375, "loss_sub_dim": 0.22165799140930176, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.98828125, "step": 1702 }, { "epoch": 1.6312260536398466, "grad_norm": 4.543445587158203, "learning_rate": 7.815789473684211e-07, "loss": 0.4329, "step": 1703 }, { "epoch": 1.6312260536398466, "loss_full_dim": 0.2702576518058777, "loss_main": 0.5522418022155762, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2819841206073761, "loss_vclub": 0.001068115234375, "parscale_sim": 0.98046875, "step": 1703 }, { "epoch": 1.632183908045977, "grad_norm": 7.591314792633057, "learning_rate": 7.789473684210527e-07, "loss": 0.5522, "step": 1704 }, { "epoch": 1.632183908045977, "loss_full_dim": 0.23690542578697205, "loss_main": 0.4855753481388092, "loss_parscale": 0.48828125, "loss_sub_dim": 0.24866992235183716, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1704 }, { "epoch": 1.6331417624521074, "grad_norm": 8.443010330200195, "learning_rate": 7.763157894736843e-07, "loss": 0.4856, "step": 1705 }, { "epoch": 1.6331417624521074, "loss_full_dim": 0.29221487045288086, "loss_main": 0.5944967865943909, "loss_parscale": 0.60546875, "loss_sub_dim": 0.30228191614151, "loss_vclub": 0.00104522705078125, "parscale_sim": 0.98828125, "step": 1705 }, { "epoch": 1.6340996168582376, "grad_norm": 10.611771583557129, "learning_rate": 7.736842105263158e-07, "loss": 0.5945, "step": 1706 }, { "epoch": 1.6340996168582376, "loss_full_dim": 0.2866276800632477, "loss_main": 0.5848509073257446, "loss_parscale": 0.58203125, "loss_sub_dim": 0.29822319746017456, "loss_vclub": 0.00091552734375, "parscale_sim": 0.98828125, "step": 1706 }, { "epoch": 1.6350574712643677, "grad_norm": 6.654287338256836, "learning_rate": 7.710526315789474e-07, "loss": 0.5849, "step": 1707 }, { "epoch": 1.6350574712643677, "loss_full_dim": 0.29695361852645874, "loss_main": 0.6051264405250549, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3081728219985962, "loss_vclub": 0.000698089599609375, "parscale_sim": 0.9765625, "step": 1707 }, { "epoch": 1.6360153256704981, "grad_norm": 7.959013938903809, "learning_rate": 7.684210526315789e-07, "loss": 0.6051, "step": 1708 }, { "epoch": 1.6360153256704981, "loss_full_dim": 0.2597392797470093, "loss_main": 0.531035304069519, "loss_parscale": 0.5390625, "loss_sub_dim": 0.27129602432250977, "loss_vclub": 0.000926971435546875, "parscale_sim": 0.984375, "step": 1708 }, { "epoch": 1.6369731800766285, "grad_norm": 4.128355503082275, "learning_rate": 7.657894736842106e-07, "loss": 0.531, "step": 1709 }, { "epoch": 1.6369731800766285, "loss_full_dim": 0.24293483793735504, "loss_main": 0.497306764125824, "loss_parscale": 0.5, "loss_sub_dim": 0.25437191128730774, "loss_vclub": 0.000904083251953125, "parscale_sim": 0.984375, "step": 1709 }, { "epoch": 1.6379310344827587, "grad_norm": 6.819427490234375, "learning_rate": 7.631578947368422e-07, "loss": 0.4973, "step": 1710 }, { "epoch": 1.6379310344827587, "loss_full_dim": 0.2405693382024765, "loss_main": 0.4903212785720825, "loss_parscale": 0.490234375, "loss_sub_dim": 0.24975192546844482, "loss_vclub": 0.00109100341796875, "parscale_sim": 0.984375, "step": 1710 }, { "epoch": 1.6388888888888888, "grad_norm": 7.865030765533447, "learning_rate": 7.605263157894738e-07, "loss": 0.4903, "step": 1711 }, { "epoch": 1.6388888888888888, "loss_full_dim": 0.2831250727176666, "loss_main": 0.5760132074356079, "loss_parscale": 0.578125, "loss_sub_dim": 0.2928881049156189, "loss_vclub": 0.00118255615234375, "parscale_sim": 0.984375, "step": 1711 }, { "epoch": 1.6398467432950192, "grad_norm": 6.685212135314941, "learning_rate": 7.578947368421054e-07, "loss": 0.576, "step": 1712 }, { "epoch": 1.6398467432950192, "loss_full_dim": 0.2770063281059265, "loss_main": 0.5650392770767212, "loss_parscale": 0.55859375, "loss_sub_dim": 0.2880329191684723, "loss_vclub": 0.0008544921875, "parscale_sim": 0.984375, "step": 1712 }, { "epoch": 1.6408045977011494, "grad_norm": 8.996415138244629, "learning_rate": 7.552631578947369e-07, "loss": 0.565, "step": 1713 }, { "epoch": 1.6408045977011494, "loss_full_dim": 0.23546184599399567, "loss_main": 0.4803426265716553, "loss_parscale": 0.482421875, "loss_sub_dim": 0.2448807656764984, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1713 }, { "epoch": 1.6417624521072796, "grad_norm": 5.414271354675293, "learning_rate": 7.526315789473684e-07, "loss": 0.4803, "step": 1714 }, { "epoch": 1.6417624521072796, "loss_full_dim": 0.2978515326976776, "loss_main": 0.6075451374053955, "loss_parscale": 0.609375, "loss_sub_dim": 0.3096936345100403, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.984375, "step": 1714 }, { "epoch": 1.64272030651341, "grad_norm": 5.758373737335205, "learning_rate": 7.5e-07, "loss": 0.6075, "step": 1715 }, { "epoch": 1.64272030651341, "loss_full_dim": 0.2956203520298004, "loss_main": 0.6045821905136108, "loss_parscale": 0.609375, "loss_sub_dim": 0.3089618682861328, "loss_vclub": 0.001190185546875, "parscale_sim": 0.98828125, "step": 1715 }, { "epoch": 1.6436781609195403, "grad_norm": 6.4064741134643555, "learning_rate": 7.473684210526316e-07, "loss": 0.6046, "step": 1716 }, { "epoch": 1.6436781609195403, "loss_full_dim": 0.28089770674705505, "loss_main": 0.5741734504699707, "loss_parscale": 0.578125, "loss_sub_dim": 0.29327577352523804, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.984375, "step": 1716 }, { "epoch": 1.6446360153256705, "grad_norm": 8.629371643066406, "learning_rate": 7.447368421052632e-07, "loss": 0.5742, "step": 1717 }, { "epoch": 1.6446360153256705, "loss_full_dim": 0.27700379490852356, "loss_main": 0.5642057657241821, "loss_parscale": 0.5625, "loss_sub_dim": 0.28720200061798096, "loss_vclub": 0.000865936279296875, "parscale_sim": 0.98046875, "step": 1717 }, { "epoch": 1.6455938697318007, "grad_norm": 6.046170711517334, "learning_rate": 7.421052631578949e-07, "loss": 0.5642, "step": 1718 }, { "epoch": 1.6455938697318007, "loss_full_dim": 0.29448163509368896, "loss_main": 0.6002248525619507, "loss_parscale": 0.60546875, "loss_sub_dim": 0.30574318766593933, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.98828125, "step": 1718 }, { "epoch": 1.646551724137931, "grad_norm": 6.357515811920166, "learning_rate": 7.394736842105265e-07, "loss": 0.6002, "step": 1719 }, { "epoch": 1.646551724137931, "loss_full_dim": 0.2688697278499603, "loss_main": 0.5472028255462646, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2783331274986267, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.984375, "step": 1719 }, { "epoch": 1.6475095785440614, "grad_norm": 6.169459342956543, "learning_rate": 7.368421052631579e-07, "loss": 0.5472, "step": 1720 }, { "epoch": 1.6475095785440614, "loss_full_dim": 0.2756790816783905, "loss_main": 0.5607767105102539, "loss_parscale": 0.56640625, "loss_sub_dim": 0.285097599029541, "loss_vclub": 0.0008544921875, "parscale_sim": 0.98828125, "step": 1720 }, { "epoch": 1.6484674329501916, "grad_norm": 6.938109874725342, "learning_rate": 7.342105263157895e-07, "loss": 0.5608, "step": 1721 }, { "epoch": 1.6484674329501916, "loss_full_dim": 0.28709468245506287, "loss_main": 0.5876526832580566, "loss_parscale": 0.59375, "loss_sub_dim": 0.30055803060531616, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.984375, "step": 1721 }, { "epoch": 1.6494252873563218, "grad_norm": 9.2144775390625, "learning_rate": 7.315789473684211e-07, "loss": 0.5877, "step": 1722 }, { "epoch": 1.6494252873563218, "loss_full_dim": 0.2664441764354706, "loss_main": 0.5425406694412231, "loss_parscale": 0.546875, "loss_sub_dim": 0.27609652280807495, "loss_vclub": 0.000934600830078125, "parscale_sim": 0.984375, "step": 1722 }, { "epoch": 1.6503831417624522, "grad_norm": 7.396927833557129, "learning_rate": 7.289473684210527e-07, "loss": 0.5425, "step": 1723 }, { "epoch": 1.6503831417624522, "loss_full_dim": 0.264554888010025, "loss_main": 0.5406920909881592, "loss_parscale": 0.54296875, "loss_sub_dim": 0.27613717317581177, "loss_vclub": 0.001068115234375, "parscale_sim": 0.9765625, "step": 1723 }, { "epoch": 1.6513409961685823, "grad_norm": 6.490091323852539, "learning_rate": 7.263157894736843e-07, "loss": 0.5407, "step": 1724 }, { "epoch": 1.6513409961685823, "loss_full_dim": 0.24751275777816772, "loss_main": 0.506250262260437, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2587375044822693, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.984375, "step": 1724 }, { "epoch": 1.6522988505747125, "grad_norm": 4.777124881744385, "learning_rate": 7.236842105263158e-07, "loss": 0.5063, "step": 1725 }, { "epoch": 1.6522988505747125, "loss_full_dim": 0.2618204653263092, "loss_main": 0.5339954495429993, "loss_parscale": 0.546875, "loss_sub_dim": 0.27217498421669006, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1725 }, { "epoch": 1.6532567049808429, "grad_norm": 6.214465141296387, "learning_rate": 7.210526315789475e-07, "loss": 0.534, "step": 1726 }, { "epoch": 1.6532567049808429, "loss_full_dim": 0.2104220688343048, "loss_main": 0.4346393346786499, "loss_parscale": 0.4375, "loss_sub_dim": 0.2242172658443451, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1726 }, { "epoch": 1.6542145593869733, "grad_norm": 8.6441011428833, "learning_rate": 7.184210526315791e-07, "loss": 0.4346, "step": 1727 }, { "epoch": 1.6542145593869733, "loss_full_dim": 0.2531913220882416, "loss_main": 0.5195236206054688, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26633232831954956, "loss_vclub": 0.00090789794921875, "parscale_sim": 0.98828125, "step": 1727 }, { "epoch": 1.6551724137931034, "grad_norm": 8.76309585571289, "learning_rate": 7.157894736842106e-07, "loss": 0.5195, "step": 1728 }, { "epoch": 1.6551724137931034, "loss_full_dim": 0.27435681223869324, "loss_main": 0.560492992401123, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2861362099647522, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.984375, "step": 1728 }, { "epoch": 1.6561302681992336, "grad_norm": 6.013772487640381, "learning_rate": 7.131578947368422e-07, "loss": 0.5605, "step": 1729 }, { "epoch": 1.6561302681992336, "loss_full_dim": 0.2699492871761322, "loss_main": 0.5526022911071777, "loss_parscale": 0.5546875, "loss_sub_dim": 0.28265297412872314, "loss_vclub": 0.000946044921875, "parscale_sim": 0.98828125, "step": 1729 }, { "epoch": 1.657088122605364, "grad_norm": 7.6068925857543945, "learning_rate": 7.105263157894737e-07, "loss": 0.5526, "step": 1730 }, { "epoch": 1.657088122605364, "loss_full_dim": 0.2678692638874054, "loss_main": 0.54671311378479, "loss_parscale": 0.5546875, "loss_sub_dim": 0.27884382009506226, "loss_vclub": 0.00099945068359375, "parscale_sim": 0.98046875, "step": 1730 }, { "epoch": 1.6580459770114944, "grad_norm": 8.231463432312012, "learning_rate": 7.078947368421053e-07, "loss": 0.5467, "step": 1731 }, { "epoch": 1.6580459770114944, "loss_full_dim": 0.25831010937690735, "loss_main": 0.5278825759887695, "loss_parscale": 0.52734375, "loss_sub_dim": 0.26957249641418457, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.98828125, "step": 1731 }, { "epoch": 1.6590038314176245, "grad_norm": 8.416131019592285, "learning_rate": 7.052631578947369e-07, "loss": 0.5279, "step": 1732 }, { "epoch": 1.6590038314176245, "loss_full_dim": 0.23971575498580933, "loss_main": 0.4915315806865692, "loss_parscale": 0.4921875, "loss_sub_dim": 0.2518158257007599, "loss_vclub": 0.000934600830078125, "parscale_sim": 0.984375, "step": 1732 }, { "epoch": 1.6599616858237547, "grad_norm": 4.740548133850098, "learning_rate": 7.026315789473685e-07, "loss": 0.4915, "step": 1733 }, { "epoch": 1.6599616858237547, "loss_full_dim": 0.22697453200817108, "loss_main": 0.4662289619445801, "loss_parscale": 0.47265625, "loss_sub_dim": 0.2392544150352478, "loss_vclub": 0.00109100341796875, "parscale_sim": 0.98828125, "step": 1733 }, { "epoch": 1.660919540229885, "grad_norm": 4.615904331207275, "learning_rate": 7.000000000000001e-07, "loss": 0.4662, "step": 1734 }, { "epoch": 1.660919540229885, "loss_full_dim": 0.2972922623157501, "loss_main": 0.6065285205841064, "loss_parscale": 0.62109375, "loss_sub_dim": 0.3092362880706787, "loss_vclub": 0.0007781982421875, "parscale_sim": 0.984375, "step": 1734 }, { "epoch": 1.6618773946360155, "grad_norm": 6.404580593109131, "learning_rate": 6.973684210526316e-07, "loss": 0.6065, "step": 1735 }, { "epoch": 1.6618773946360155, "loss_full_dim": 0.22210004925727844, "loss_main": 0.4546557664871216, "loss_parscale": 0.45703125, "loss_sub_dim": 0.23255571722984314, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.984375, "step": 1735 }, { "epoch": 1.6628352490421456, "grad_norm": 7.176109790802002, "learning_rate": 6.947368421052631e-07, "loss": 0.4547, "step": 1736 }, { "epoch": 1.6628352490421456, "loss_full_dim": 0.2582071125507355, "loss_main": 0.5281885862350464, "loss_parscale": 0.53125, "loss_sub_dim": 0.2699814736843109, "loss_vclub": 0.00083160400390625, "parscale_sim": 0.984375, "step": 1736 }, { "epoch": 1.6637931034482758, "grad_norm": 10.08082389831543, "learning_rate": 6.921052631578948e-07, "loss": 0.5282, "step": 1737 }, { "epoch": 1.6637931034482758, "loss_full_dim": 0.26656413078308105, "loss_main": 0.5448238253593445, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2782596945762634, "loss_vclub": 0.00103759765625, "parscale_sim": 0.984375, "step": 1737 }, { "epoch": 1.6647509578544062, "grad_norm": 7.992217063903809, "learning_rate": 6.894736842105264e-07, "loss": 0.5448, "step": 1738 }, { "epoch": 1.6647509578544062, "loss_full_dim": 0.27329838275909424, "loss_main": 0.5575627684593201, "loss_parscale": 0.56640625, "loss_sub_dim": 0.28426438570022583, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.9765625, "step": 1738 }, { "epoch": 1.6657088122605364, "grad_norm": 9.48056411743164, "learning_rate": 6.86842105263158e-07, "loss": 0.5576, "step": 1739 }, { "epoch": 1.6657088122605364, "loss_full_dim": 0.27982455492019653, "loss_main": 0.5702461004257202, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2904215455055237, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98828125, "step": 1739 }, { "epoch": 1.6666666666666665, "grad_norm": 7.491960525512695, "learning_rate": 6.842105263157896e-07, "loss": 0.5702, "step": 1740 }, { "epoch": 1.6666666666666665, "loss_full_dim": 0.23979824781417847, "loss_main": 0.4906965494155884, "loss_parscale": 0.4921875, "loss_sub_dim": 0.2508983016014099, "loss_vclub": 0.000598907470703125, "parscale_sim": 0.984375, "step": 1740 }, { "epoch": 1.667624521072797, "grad_norm": 7.459261417388916, "learning_rate": 6.815789473684211e-07, "loss": 0.4907, "step": 1741 }, { "epoch": 1.667624521072797, "loss_full_dim": 0.2719390392303467, "loss_main": 0.5561978816986084, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2842588424682617, "loss_vclub": 0.000911712646484375, "parscale_sim": 0.984375, "step": 1741 }, { "epoch": 1.6685823754789273, "grad_norm": 7.314126491546631, "learning_rate": 6.789473684210526e-07, "loss": 0.5562, "step": 1742 }, { "epoch": 1.6685823754789273, "loss_full_dim": 0.2928670048713684, "loss_main": 0.5994343161582947, "loss_parscale": 0.59375, "loss_sub_dim": 0.30656731128692627, "loss_vclub": 0.000873565673828125, "parscale_sim": 0.98828125, "step": 1742 }, { "epoch": 1.6695402298850575, "grad_norm": 5.921130180358887, "learning_rate": 6.763157894736842e-07, "loss": 0.5994, "step": 1743 }, { "epoch": 1.6695402298850575, "loss_full_dim": 0.2967711091041565, "loss_main": 0.605220377445221, "loss_parscale": 0.60546875, "loss_sub_dim": 0.30844926834106445, "loss_vclub": 0.00096893310546875, "parscale_sim": 0.984375, "step": 1743 }, { "epoch": 1.6704980842911876, "grad_norm": 6.708566665649414, "learning_rate": 6.736842105263158e-07, "loss": 0.6052, "step": 1744 }, { "epoch": 1.6704980842911876, "loss_full_dim": 0.2608266770839691, "loss_main": 0.5333676338195801, "loss_parscale": 0.54296875, "loss_sub_dim": 0.2725409269332886, "loss_vclub": 0.000949859619140625, "parscale_sim": 0.98828125, "step": 1744 }, { "epoch": 1.671455938697318, "grad_norm": 7.581732749938965, "learning_rate": 6.710526315789475e-07, "loss": 0.5334, "step": 1745 }, { "epoch": 1.671455938697318, "loss_full_dim": 0.31889399886131287, "loss_main": 0.6493856906890869, "loss_parscale": 0.65625, "loss_sub_dim": 0.33049166202545166, "loss_vclub": 0.0011444091796875, "parscale_sim": 0.984375, "step": 1745 }, { "epoch": 1.6724137931034484, "grad_norm": 7.603579521179199, "learning_rate": 6.684210526315791e-07, "loss": 0.6494, "step": 1746 }, { "epoch": 1.6724137931034484, "loss_full_dim": 0.22857853770256042, "loss_main": 0.4675835072994232, "loss_parscale": 0.470703125, "loss_sub_dim": 0.2390049695968628, "loss_vclub": 0.0009307861328125, "parscale_sim": 0.98828125, "step": 1746 }, { "epoch": 1.6733716475095786, "grad_norm": 6.239498615264893, "learning_rate": 6.657894736842106e-07, "loss": 0.4676, "step": 1747 }, { "epoch": 1.6733716475095786, "loss_full_dim": 0.37447601556777954, "loss_main": 0.7621828317642212, "loss_parscale": 0.76953125, "loss_sub_dim": 0.38770681619644165, "loss_vclub": 0.000946044921875, "parscale_sim": 0.984375, "step": 1747 }, { "epoch": 1.6743295019157087, "grad_norm": 11.680092811584473, "learning_rate": 6.631578947368422e-07, "loss": 0.7622, "step": 1748 }, { "epoch": 1.6743295019157087, "loss_full_dim": 0.30357587337493896, "loss_main": 0.6195107102394104, "loss_parscale": 0.625, "loss_sub_dim": 0.31593483686447144, "loss_vclub": 0.0009765625, "parscale_sim": 0.984375, "step": 1748 }, { "epoch": 1.6752873563218391, "grad_norm": 6.568049907684326, "learning_rate": 6.605263157894737e-07, "loss": 0.6195, "step": 1749 }, { "epoch": 1.6752873563218391, "loss_full_dim": 0.26006391644477844, "loss_main": 0.5327848196029663, "loss_parscale": 0.53125, "loss_sub_dim": 0.27272093296051025, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1749 }, { "epoch": 1.6762452107279695, "grad_norm": 7.309226989746094, "learning_rate": 6.578947368421053e-07, "loss": 0.5328, "step": 1750 }, { "epoch": 1.6762452107279695, "loss_full_dim": 0.23684927821159363, "loss_main": 0.4841547906398773, "loss_parscale": 0.484375, "loss_sub_dim": 0.2473055124282837, "loss_vclub": 0.00098419189453125, "parscale_sim": 0.98046875, "step": 1750 }, { "epoch": 1.6772030651340997, "grad_norm": 6.990508556365967, "learning_rate": 6.552631578947369e-07, "loss": 0.4842, "step": 1751 }, { "epoch": 1.6772030651340997, "loss_full_dim": 0.2860237956047058, "loss_main": 0.5819444060325623, "loss_parscale": 0.58203125, "loss_sub_dim": 0.29592061042785645, "loss_vclub": 0.000789642333984375, "parscale_sim": 0.984375, "step": 1751 }, { "epoch": 1.6781609195402298, "grad_norm": 5.87493371963501, "learning_rate": 6.526315789473684e-07, "loss": 0.5819, "step": 1752 }, { "epoch": 1.6781609195402298, "loss_full_dim": 0.26403552293777466, "loss_main": 0.5392841696739197, "loss_parscale": 0.5390625, "loss_sub_dim": 0.275248646736145, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1752 }, { "epoch": 1.6791187739463602, "grad_norm": 5.800407409667969, "learning_rate": 6.5e-07, "loss": 0.5393, "step": 1753 }, { "epoch": 1.6791187739463602, "loss_full_dim": 0.23313376307487488, "loss_main": 0.4780712127685547, "loss_parscale": 0.4765625, "loss_sub_dim": 0.2449374496936798, "loss_vclub": 0.0009613037109375, "parscale_sim": 0.984375, "step": 1753 }, { "epoch": 1.6800766283524904, "grad_norm": 6.857458114624023, "learning_rate": 6.473684210526317e-07, "loss": 0.4781, "step": 1754 }, { "epoch": 1.6800766283524904, "loss_full_dim": 0.23659707605838776, "loss_main": 0.4844427704811096, "loss_parscale": 0.4921875, "loss_sub_dim": 0.24784567952156067, "loss_vclub": 0.0010986328125, "parscale_sim": 0.98828125, "step": 1754 }, { "epoch": 1.6810344827586206, "grad_norm": 6.848397254943848, "learning_rate": 6.447368421052633e-07, "loss": 0.4844, "step": 1755 }, { "epoch": 1.6810344827586206, "loss_full_dim": 0.27805957198143005, "loss_main": 0.5683271884918213, "loss_parscale": 0.578125, "loss_sub_dim": 0.29026758670806885, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.984375, "step": 1755 }, { "epoch": 1.681992337164751, "grad_norm": 9.316546440124512, "learning_rate": 6.421052631578948e-07, "loss": 0.5683, "step": 1756 }, { "epoch": 1.681992337164751, "loss_full_dim": 0.2825341522693634, "loss_main": 0.5752884149551392, "loss_parscale": 0.578125, "loss_sub_dim": 0.29275429248809814, "loss_vclub": 0.00092315673828125, "parscale_sim": 0.98828125, "step": 1756 }, { "epoch": 1.6829501915708813, "grad_norm": 6.2714433670043945, "learning_rate": 6.394736842105264e-07, "loss": 0.5753, "step": 1757 }, { "epoch": 1.6829501915708813, "loss_full_dim": 0.27051424980163574, "loss_main": 0.5518558621406555, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2813416123390198, "loss_vclub": 0.0011444091796875, "parscale_sim": 0.98828125, "step": 1757 }, { "epoch": 1.6839080459770115, "grad_norm": 7.185793876647949, "learning_rate": 6.368421052631579e-07, "loss": 0.5519, "step": 1758 }, { "epoch": 1.6839080459770115, "loss_full_dim": 0.2661648988723755, "loss_main": 0.5436320304870605, "loss_parscale": 0.546875, "loss_sub_dim": 0.27746713161468506, "loss_vclub": 0.00086212158203125, "parscale_sim": 0.984375, "step": 1758 }, { "epoch": 1.6848659003831417, "grad_norm": 8.086124420166016, "learning_rate": 6.342105263157895e-07, "loss": 0.5436, "step": 1759 }, { "epoch": 1.6848659003831417, "loss_full_dim": 0.2827990651130676, "loss_main": 0.5765740871429443, "loss_parscale": 0.578125, "loss_sub_dim": 0.2937750220298767, "loss_vclub": 0.000881195068359375, "parscale_sim": 0.984375, "step": 1759 }, { "epoch": 1.685823754789272, "grad_norm": 7.569667816162109, "learning_rate": 6.315789473684211e-07, "loss": 0.5766, "step": 1760 }, { "epoch": 1.685823754789272, "loss_full_dim": 0.2787226438522339, "loss_main": 0.5697012543678284, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2909786105155945, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.984375, "step": 1760 }, { "epoch": 1.6867816091954024, "grad_norm": 6.264378070831299, "learning_rate": 6.289473684210527e-07, "loss": 0.5697, "step": 1761 }, { "epoch": 1.6867816091954024, "loss_full_dim": 0.26663851737976074, "loss_main": 0.5438904762268066, "loss_parscale": 0.546875, "loss_sub_dim": 0.2772519588470459, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.984375, "step": 1761 }, { "epoch": 1.6877394636015326, "grad_norm": 6.718122482299805, "learning_rate": 6.263157894736844e-07, "loss": 0.5439, "step": 1762 }, { "epoch": 1.6877394636015326, "loss_full_dim": 0.2435539960861206, "loss_main": 0.4993220865726471, "loss_parscale": 0.50390625, "loss_sub_dim": 0.2557680904865265, "loss_vclub": 0.0012359619140625, "parscale_sim": 0.984375, "step": 1762 }, { "epoch": 1.6886973180076628, "grad_norm": 10.519811630249023, "learning_rate": 6.236842105263158e-07, "loss": 0.4993, "step": 1763 }, { "epoch": 1.6886973180076628, "loss_full_dim": 0.2590789198875427, "loss_main": 0.5290013551712036, "loss_parscale": 0.5234375, "loss_sub_dim": 0.2699224650859833, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.984375, "step": 1763 }, { "epoch": 1.6896551724137931, "grad_norm": 5.453591823577881, "learning_rate": 6.210526315789474e-07, "loss": 0.529, "step": 1764 }, { "epoch": 1.6896551724137931, "loss_full_dim": 0.27652913331985474, "loss_main": 0.5641937851905823, "loss_parscale": 0.5625, "loss_sub_dim": 0.28766465187072754, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.98046875, "step": 1764 }, { "epoch": 1.6906130268199235, "grad_norm": 8.00952434539795, "learning_rate": 6.18421052631579e-07, "loss": 0.5642, "step": 1765 }, { "epoch": 1.6906130268199235, "loss_full_dim": 0.2956891655921936, "loss_main": 0.6026374101638794, "loss_parscale": 0.6015625, "loss_sub_dim": 0.3069482743740082, "loss_vclub": 0.00102996826171875, "parscale_sim": 0.984375, "step": 1765 }, { "epoch": 1.6915708812260535, "grad_norm": 7.600696563720703, "learning_rate": 6.157894736842106e-07, "loss": 0.6026, "step": 1766 }, { "epoch": 1.6915708812260535, "loss_full_dim": 0.27852532267570496, "loss_main": 0.5681198835372925, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2895945608615875, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.984375, "step": 1766 }, { "epoch": 1.6925287356321839, "grad_norm": 6.771373748779297, "learning_rate": 6.131578947368422e-07, "loss": 0.5681, "step": 1767 }, { "epoch": 1.6925287356321839, "loss_full_dim": 0.27762311697006226, "loss_main": 0.567655622959137, "loss_parscale": 0.5703125, "loss_sub_dim": 0.2900325059890747, "loss_vclub": 0.00091552734375, "parscale_sim": 0.984375, "step": 1767 }, { "epoch": 1.6934865900383143, "grad_norm": 8.869318008422852, "learning_rate": 6.105263157894738e-07, "loss": 0.5677, "step": 1768 }, { "epoch": 1.6934865900383143, "loss_full_dim": 0.2573343515396118, "loss_main": 0.5266454219818115, "loss_parscale": 0.5390625, "loss_sub_dim": 0.2693111002445221, "loss_vclub": 0.00089263916015625, "parscale_sim": 0.98046875, "step": 1768 }, { "epoch": 1.6944444444444444, "grad_norm": 5.0459771156311035, "learning_rate": 6.078947368421053e-07, "loss": 0.5266, "step": 1769 }, { "epoch": 1.6944444444444444, "loss_full_dim": 0.29125237464904785, "loss_main": 0.5937061905860901, "loss_parscale": 0.59375, "loss_sub_dim": 0.30245381593704224, "loss_vclub": 0.000804901123046875, "parscale_sim": 0.9765625, "step": 1769 }, { "epoch": 1.6954022988505746, "grad_norm": 6.230727672576904, "learning_rate": 6.052631578947369e-07, "loss": 0.5937, "step": 1770 }, { "epoch": 1.6954022988505746, "loss_full_dim": 0.2755887508392334, "loss_main": 0.5625717639923096, "loss_parscale": 0.5625, "loss_sub_dim": 0.28698304295539856, "loss_vclub": 0.00095367431640625, "parscale_sim": 0.984375, "step": 1770 }, { "epoch": 1.696360153256705, "grad_norm": 7.206476211547852, "learning_rate": 6.026315789473685e-07, "loss": 0.5626, "step": 1771 }, { "epoch": 1.696360153256705, "loss_full_dim": 0.32905569672584534, "loss_main": 0.6698863506317139, "loss_parscale": 0.6640625, "loss_sub_dim": 0.3408306837081909, "loss_vclub": 0.00101470947265625, "parscale_sim": 0.984375, "step": 1771 }, { "epoch": 1.6973180076628354, "grad_norm": 8.77536392211914, "learning_rate": 6.000000000000001e-07, "loss": 0.6699, "step": 1772 }, { "epoch": 1.6973180076628354, "loss_full_dim": 0.24773859977722168, "loss_main": 0.509772539138794, "loss_parscale": 0.5078125, "loss_sub_dim": 0.2620339095592499, "loss_vclub": 0.00103759765625, "parscale_sim": 0.984375, "step": 1772 }, { "epoch": 1.6982758620689655, "grad_norm": 6.614867687225342, "learning_rate": 5.973684210526317e-07, "loss": 0.5098, "step": 1773 }, { "epoch": 1.6982758620689655, "loss_full_dim": 0.26627805829048157, "loss_main": 0.5425355434417725, "loss_parscale": 0.55078125, "loss_sub_dim": 0.2762575149536133, "loss_vclub": 0.0012054443359375, "parscale_sim": 0.98828125, "step": 1773 }, { "epoch": 1.6992337164750957, "grad_norm": 7.106132507324219, "learning_rate": 5.947368421052632e-07, "loss": 0.5425, "step": 1774 }, { "epoch": 1.6992337164750957, "loss_full_dim": 0.2630713880062103, "loss_main": 0.5373724699020386, "loss_parscale": 0.5546875, "loss_sub_dim": 0.27430111169815063, "loss_vclub": 0.000957489013671875, "parscale_sim": 0.98046875, "step": 1774 }, { "epoch": 1.700191570881226, "grad_norm": 53.64697265625, "learning_rate": 5.921052631578947e-07, "loss": 0.5374, "step": 1775 }, { "epoch": 1.700191570881226, "loss_full_dim": 0.2917274236679077, "loss_main": 0.5946029424667358, "loss_parscale": 0.59375, "loss_sub_dim": 0.3028755187988281, "loss_vclub": 0.00115203857421875, "parscale_sim": 0.984375, "step": 1775 }, { "epoch": 1.7011494252873565, "grad_norm": 4.604063510894775, "learning_rate": 5.894736842105263e-07, "loss": 0.5946, "step": 1776 }, { "epoch": 1.7011494252873565, "loss_full_dim": 0.2652106285095215, "loss_main": 0.5414621233940125, "loss_parscale": 0.5546875, "loss_sub_dim": 0.27625149488449097, "loss_vclub": 0.0010223388671875, "parscale_sim": 0.984375, "step": 1776 }, { "epoch": 1.7021072796934866, "grad_norm": 6.764899730682373, "learning_rate": 5.86842105263158e-07, "loss": 0.5415, "step": 1777 }, { "epoch": 1.7021072796934866, "loss_full_dim": 0.2876269519329071, "loss_main": 0.5860226154327393, "loss_parscale": 0.5859375, "loss_sub_dim": 0.29839569330215454, "loss_vclub": 0.0008087158203125, "parscale_sim": 0.98828125, "step": 1777 }, { "epoch": 1.7030651340996168, "grad_norm": 5.59177827835083, "learning_rate": 5.842105263157896e-07, "loss": 0.586, "step": 1778 }, { "epoch": 1.7030651340996168, "loss_full_dim": 0.2702898383140564, "loss_main": 0.5516209602355957, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2813311517238617, "loss_vclub": 0.000732421875, "parscale_sim": 0.98046875, "step": 1778 }, { "epoch": 1.7040229885057472, "grad_norm": 7.806240558624268, "learning_rate": 5.81578947368421e-07, "loss": 0.5516, "step": 1779 }, { "epoch": 1.7040229885057472, "loss_full_dim": 0.2960853576660156, "loss_main": 0.605324387550354, "loss_parscale": 0.60546875, "loss_sub_dim": 0.309239000082016, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1779 }, { "epoch": 1.7049808429118773, "grad_norm": 7.746889591217041, "learning_rate": 5.789473684210526e-07, "loss": 0.6053, "step": 1780 }, { "epoch": 1.7049808429118773, "loss_full_dim": 0.2891220152378082, "loss_main": 0.5896549224853516, "loss_parscale": 0.5859375, "loss_sub_dim": 0.30053287744522095, "loss_vclub": 0.000934600830078125, "parscale_sim": 0.98828125, "step": 1780 }, { "epoch": 1.7059386973180075, "grad_norm": 8.948284149169922, "learning_rate": 5.763157894736843e-07, "loss": 0.5897, "step": 1781 }, { "epoch": 1.7059386973180075, "loss_full_dim": 0.3015420436859131, "loss_main": 0.6167237758636475, "loss_parscale": 0.625, "loss_sub_dim": 0.315181702375412, "loss_vclub": 0.000873565673828125, "parscale_sim": 0.984375, "step": 1781 }, { "epoch": 1.706896551724138, "grad_norm": 6.452831268310547, "learning_rate": 5.736842105263158e-07, "loss": 0.6167, "step": 1782 }, { "epoch": 1.706896551724138, "loss_full_dim": 0.26725953817367554, "loss_main": 0.5461010336875916, "loss_parscale": 0.5546875, "loss_sub_dim": 0.278841495513916, "loss_vclub": 0.000823974609375, "parscale_sim": 0.984375, "step": 1782 }, { "epoch": 1.7078544061302683, "grad_norm": 4.764255523681641, "learning_rate": 5.710526315789474e-07, "loss": 0.5461, "step": 1783 }, { "epoch": 1.7078544061302683, "loss_full_dim": 0.30011120438575745, "loss_main": 0.6121444702148438, "loss_parscale": 0.6171875, "loss_sub_dim": 0.3120332956314087, "loss_vclub": 0.0008697509765625, "parscale_sim": 0.984375, "step": 1783 }, { "epoch": 1.7088122605363985, "grad_norm": 7.425631046295166, "learning_rate": 5.68421052631579e-07, "loss": 0.6121, "step": 1784 }, { "epoch": 1.7088122605363985, "loss_full_dim": 0.2654460370540619, "loss_main": 0.5414625406265259, "loss_parscale": 0.53515625, "loss_sub_dim": 0.2760164737701416, "loss_vclub": 0.00104522705078125, "parscale_sim": 0.98046875, "step": 1784 }, { "epoch": 1.7097701149425286, "grad_norm": 7.603494167327881, "learning_rate": 5.657894736842106e-07, "loss": 0.5415, "step": 1785 }, { "epoch": 1.7097701149425286, "loss_full_dim": 0.25905704498291016, "loss_main": 0.527397871017456, "loss_parscale": 0.53125, "loss_sub_dim": 0.2683408260345459, "loss_vclub": 0.0009765625, "parscale_sim": 0.98046875, "step": 1785 }, { "epoch": 1.710727969348659, "grad_norm": 8.147363662719727, "learning_rate": 5.631578947368421e-07, "loss": 0.5274, "step": 1786 }, { "epoch": 1.710727969348659, "loss_full_dim": 0.2684365510940552, "loss_main": 0.5475740432739258, "loss_parscale": 0.5546875, "loss_sub_dim": 0.2791374921798706, "loss_vclub": 0.001129150390625, "parscale_sim": 0.984375, "step": 1786 }, { "epoch": 1.7116858237547894, "grad_norm": 6.350757122039795, "learning_rate": 5.605263157894737e-07, "loss": 0.5476, "step": 1787 }, { "epoch": 1.7116858237547894, "loss_full_dim": 0.25423261523246765, "loss_main": 0.5209883451461792, "loss_parscale": 0.5234375, "loss_sub_dim": 0.26675575971603394, "loss_vclub": 0.00077056884765625, "parscale_sim": 0.984375, "step": 1787 }, { "epoch": 1.7126436781609196, "grad_norm": 6.242395401000977, "learning_rate": 5.578947368421053e-07, "loss": 0.521, "step": 1788 }, { "epoch": 1.7126436781609196, "loss_full_dim": 0.2416418045759201, "loss_main": 0.49546539783477783, "loss_parscale": 0.50390625, "loss_sub_dim": 0.2538236081600189, "loss_vclub": 0.001007080078125, "parscale_sim": 0.984375, "step": 1788 }, { "epoch": 1.7136015325670497, "grad_norm": 5.176364421844482, "learning_rate": 5.55263157894737e-07, "loss": 0.4955, "step": 1789 }, { "epoch": 1.7136015325670497, "loss_full_dim": 0.23512637615203857, "loss_main": 0.48301202058792114, "loss_parscale": 0.4921875, "loss_sub_dim": 0.24788565933704376, "loss_vclub": 0.000782012939453125, "parscale_sim": 0.96875, "step": 1789 }, { "epoch": 1.71455938697318, "grad_norm": 7.017070293426514, "learning_rate": 5.526315789473684e-07, "loss": 0.483, "step": 1790 }, { "epoch": 1.71455938697318, "loss_full_dim": 0.2519604563713074, "loss_main": 0.5153846144676208, "loss_parscale": 0.515625, "loss_sub_dim": 0.2634241580963135, "loss_vclub": 0.00103759765625, "parscale_sim": 0.98828125, "step": 1790 }, { "epoch": 1.7155172413793105, "grad_norm": 5.350017547607422, "learning_rate": 5.5e-07, "loss": 0.5154, "step": 1791 }, { "epoch": 1.7155172413793105, "loss_full_dim": 0.28255942463874817, "loss_main": 0.5769266486167908, "loss_parscale": 0.578125, "loss_sub_dim": 0.2943672239780426, "loss_vclub": 0.000766754150390625, "parscale_sim": 0.98046875, "step": 1791 }, { "epoch": 1.7164750957854407, "grad_norm": 7.774301528930664, "learning_rate": 5.473684210526316e-07, "loss": 0.5769, "step": 1792 }, { "epoch": 1.7164750957854407, "loss_full_dim": 0.23226508498191833, "loss_main": 0.4754698872566223, "loss_parscale": 0.48046875, "loss_sub_dim": 0.24320480227470398, "loss_vclub": 0.0009918212890625, "parscale_sim": 0.984375, "step": 1792 }, { "epoch": 1.7174329501915708, "grad_norm": 6.957308292388916, "learning_rate": 5.447368421052632e-07, "loss": 0.4755, "step": 1793 }, { "epoch": 1.7174329501915708, "loss_full_dim": 0.28874465823173523, "loss_main": 0.5889880657196045, "loss_parscale": 0.59375, "loss_sub_dim": 0.30024343729019165, "loss_vclub": 0.0010528564453125, "parscale_sim": 0.98828125, "step": 1793 }, { "epoch": 1.7183908045977012, "grad_norm": 7.239353656768799, "learning_rate": 5.421052631578948e-07, "loss": 0.589, "step": 1794 }, { "epoch": 1.7183908045977012, "loss_full_dim": 0.22177042067050934, "loss_main": 0.455802857875824, "loss_parscale": 0.45703125, "loss_sub_dim": 0.23403245210647583, "loss_vclub": 0.0008392333984375, "parscale_sim": 0.984375, "step": 1794 }, { "epoch": 1.7193486590038314, "grad_norm": 6.337100505828857, "learning_rate": 5.394736842105264e-07, "loss": 0.4558, "step": 1795 }, { "epoch": 1.7193486590038314, "loss_full_dim": 0.28743019700050354, "loss_main": 0.586164653301239, "loss_parscale": 0.58984375, "loss_sub_dim": 0.2987344563007355, "loss_vclub": 0.00087738037109375, "parscale_sim": 0.9765625, "step": 1795 }, { "epoch": 1.7203065134099615, "grad_norm": 6.631336688995361, "learning_rate": 5.368421052631579e-07, "loss": 0.5862, "step": 1796 }, { "epoch": 1.7203065134099615, "loss_full_dim": 0.2640625834465027, "loss_main": 0.5408869981765747, "loss_parscale": 0.54296875, "loss_sub_dim": 0.276824414730072, "loss_vclub": 0.00093841552734375, "parscale_sim": 0.984375, "step": 1796 }, { "epoch": 1.721264367816092, "grad_norm": 6.094582557678223, "learning_rate": 5.342105263157895e-07, "loss": 0.5409, "step": 1797 }, { "epoch": 1.721264367816092, "loss_full_dim": 0.2515406310558319, "loss_main": 0.5136065483093262, "loss_parscale": 0.515625, "loss_sub_dim": 0.2620658874511719, "loss_vclub": 0.0009002685546875, "parscale_sim": 0.984375, "step": 1797 }, { "epoch": 1.7222222222222223, "grad_norm": 6.854114055633545, "learning_rate": 5.315789473684211e-07, "loss": 0.5136, "step": 1798 }, { "epoch": 1.7222222222222223, "loss_full_dim": 0.2642092704772949, "loss_main": 0.539729654788971, "loss_parscale": 0.54296875, "loss_sub_dim": 0.275520384311676, "loss_vclub": 0.000843048095703125, "parscale_sim": 0.984375, "step": 1798 }, { "epoch": 1.7231800766283525, "grad_norm": 6.055672645568848, "learning_rate": 5.289473684210527e-07, "loss": 0.5397, "step": 1799 }, { "epoch": 1.7231800766283525, "loss_full_dim": 0.26997628808021545, "loss_main": 0.5509346723556519, "loss_parscale": 0.546875, "loss_sub_dim": 0.2809584140777588, "loss_vclub": 0.0010833740234375, "parscale_sim": 0.9765625, "step": 1799 }, { "epoch": 1.7241379310344827, "grad_norm": 9.89507007598877, "learning_rate": 5.263157894736843e-07, "loss": 0.5509, "step": 1800 } ], "logging_steps": 1, "max_steps": 2000, "num_input_tokens_seen": 0, "num_train_epochs": 2, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 16, "trial_name": null, "trial_params": null }