{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 2.3710729104919976, "eval_steps": 500, "global_step": 20000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "contrastive_loss": 6.933349609375, "epoch": 0, "mse_loss": 1.020828127861023, "step": 0 }, { "epoch": 0.0011855364552459987, "grad_norm": 9.875, "learning_rate": 4.5e-07, "loss": 2.2695, "step": 10 }, { "contrastive_loss": 6.933837890625, "epoch": 0.0011855364552459987, "mse_loss": 0.8299199342727661, "step": 10 }, { "epoch": 0.0023710729104919974, "grad_norm": 7.1875, "learning_rate": 9.5e-07, "loss": 2.2796, "step": 20 }, { "contrastive_loss": 6.931396484375, "epoch": 0.0023710729104919974, "mse_loss": 1.202926516532898, "step": 20 }, { "epoch": 0.0035566093657379964, "grad_norm": 6.84375, "learning_rate": 1.45e-06, "loss": 2.3447, "step": 30 }, { "contrastive_loss": 6.939697265625, "epoch": 0.0035566093657379964, "mse_loss": 0.7193194627761841, "step": 30 }, { "epoch": 0.004742145820983995, "grad_norm": 8.9375, "learning_rate": 1.95e-06, "loss": 2.2711, "step": 40 }, { "contrastive_loss": 6.922607421875, "epoch": 0.004742145820983995, "mse_loss": 1.0706291198730469, "step": 40 }, { "epoch": 0.005927682276229994, "grad_norm": 6.96875, "learning_rate": 2.4500000000000003e-06, "loss": 2.2353, "step": 50 }, { "contrastive_loss": 6.944091796875, "epoch": 0.005927682276229994, "mse_loss": 0.7509883046150208, "step": 50 }, { "epoch": 0.007113218731475993, "grad_norm": 6.375, "learning_rate": 2.95e-06, "loss": 2.2351, "step": 60 }, { "contrastive_loss": 6.933349609375, "epoch": 0.007113218731475993, "mse_loss": 0.7211111783981323, "step": 60 }, { "epoch": 0.008298755186721992, "grad_norm": 6.21875, "learning_rate": 3.4500000000000004e-06, "loss": 2.1503, "step": 70 }, { "contrastive_loss": 6.935302734375, "epoch": 0.008298755186721992, "mse_loss": 0.7233139872550964, "step": 70 }, { "epoch": 0.00948429164196799, "grad_norm": 5.40625, "learning_rate": 3.95e-06, "loss": 2.1994, "step": 80 }, { "contrastive_loss": 6.92333984375, "epoch": 0.00948429164196799, "mse_loss": 0.8511930704116821, "step": 80 }, { "epoch": 0.01066982809721399, "grad_norm": 4.625, "learning_rate": 4.45e-06, "loss": 2.0576, "step": 90 }, { "contrastive_loss": 6.931884765625, "epoch": 0.01066982809721399, "mse_loss": 0.6933262944221497, "step": 90 }, { "epoch": 0.011855364552459988, "grad_norm": 4.59375, "learning_rate": 4.950000000000001e-06, "loss": 2.0661, "step": 100 }, { "contrastive_loss": 6.895751953125, "epoch": 0.011855364552459988, "mse_loss": 0.6859448552131653, "step": 100 }, { "epoch": 0.013040901007705987, "grad_norm": 2.859375, "learning_rate": 5.45e-06, "loss": 1.9999, "step": 110 }, { "contrastive_loss": 6.904541015625, "epoch": 0.013040901007705987, "mse_loss": 0.5288821458816528, "step": 110 }, { "epoch": 0.014226437462951986, "grad_norm": 2.578125, "learning_rate": 5.95e-06, "loss": 1.9516, "step": 120 }, { "contrastive_loss": 6.877685546875, "epoch": 0.014226437462951986, "mse_loss": 0.7619789838790894, "step": 120 }, { "epoch": 0.015411973918197985, "grad_norm": 2.6875, "learning_rate": 6.45e-06, "loss": 1.9297, "step": 130 }, { "contrastive_loss": 6.8720703125, "epoch": 0.015411973918197985, "mse_loss": 0.4591713547706604, "step": 130 }, { "epoch": 0.016597510373443983, "grad_norm": 2.234375, "learning_rate": 6.950000000000001e-06, "loss": 1.8561, "step": 140 }, { "contrastive_loss": 6.829833984375, "epoch": 0.016597510373443983, "mse_loss": 0.5009814500808716, "step": 140 }, { "epoch": 0.01778304682868998, "grad_norm": 1.7734375, "learning_rate": 7.45e-06, "loss": 1.8329, "step": 150 }, { "contrastive_loss": 6.8056640625, "epoch": 0.01778304682868998, "mse_loss": 0.4036082625389099, "step": 150 }, { "epoch": 0.01896858328393598, "grad_norm": 2.46875, "learning_rate": 7.95e-06, "loss": 1.7599, "step": 160 }, { "contrastive_loss": 6.723388671875, "epoch": 0.01896858328393598, "mse_loss": 0.3842712938785553, "step": 160 }, { "epoch": 0.02015411973918198, "grad_norm": 2.234375, "learning_rate": 8.45e-06, "loss": 1.7358, "step": 170 }, { "contrastive_loss": 6.695556640625, "epoch": 0.02015411973918198, "mse_loss": 0.3864764869213104, "step": 170 }, { "epoch": 0.02133965619442798, "grad_norm": 2.109375, "learning_rate": 8.95e-06, "loss": 1.7205, "step": 180 }, { "contrastive_loss": 6.630615234375, "epoch": 0.02133965619442798, "mse_loss": 0.4381197392940521, "step": 180 }, { "epoch": 0.022525192649673977, "grad_norm": 1.828125, "learning_rate": 9.450000000000001e-06, "loss": 1.6637, "step": 190 }, { "contrastive_loss": 6.393310546875, "epoch": 0.022525192649673977, "mse_loss": 0.34406110644340515, "step": 190 }, { "epoch": 0.023710729104919975, "grad_norm": 1.890625, "learning_rate": 9.950000000000001e-06, "loss": 1.6164, "step": 200 }, { "contrastive_loss": 6.17431640625, "epoch": 0.023710729104919975, "mse_loss": 0.3520837724208832, "step": 200 }, { "epoch": 0.024896265560165973, "grad_norm": 1.515625, "learning_rate": 1.045e-05, "loss": 1.5783, "step": 210 }, { "contrastive_loss": 6.054443359375, "epoch": 0.024896265560165973, "mse_loss": 0.3267422318458557, "step": 210 }, { "epoch": 0.026081802015411975, "grad_norm": 1.59375, "learning_rate": 1.095e-05, "loss": 1.5356, "step": 220 }, { "contrastive_loss": 5.95458984375, "epoch": 0.026081802015411975, "mse_loss": 0.30424055457115173, "step": 220 }, { "epoch": 0.027267338470657973, "grad_norm": 2.78125, "learning_rate": 1.145e-05, "loss": 1.4937, "step": 230 }, { "contrastive_loss": 5.92431640625, "epoch": 0.027267338470657973, "mse_loss": 0.2958686649799347, "step": 230 }, { "epoch": 0.02845287492590397, "grad_norm": 1.3671875, "learning_rate": 1.195e-05, "loss": 1.4684, "step": 240 }, { "contrastive_loss": 5.811767578125, "epoch": 0.02845287492590397, "mse_loss": 0.3790566921234131, "step": 240 }, { "epoch": 0.02963841138114997, "grad_norm": 1.5859375, "learning_rate": 1.2450000000000001e-05, "loss": 1.452, "step": 250 }, { "contrastive_loss": 5.767578125, "epoch": 0.02963841138114997, "mse_loss": 0.3338494896888733, "step": 250 }, { "epoch": 0.03082394783639597, "grad_norm": 1.6640625, "learning_rate": 1.2950000000000001e-05, "loss": 1.4351, "step": 260 }, { "contrastive_loss": 5.719482421875, "epoch": 0.03082394783639597, "mse_loss": 0.27089783549308777, "step": 260 }, { "epoch": 0.032009484291641965, "grad_norm": 1.6875, "learning_rate": 1.3450000000000002e-05, "loss": 1.4292, "step": 270 }, { "contrastive_loss": 5.584228515625, "epoch": 0.032009484291641965, "mse_loss": 0.315051406621933, "step": 270 }, { "epoch": 0.03319502074688797, "grad_norm": 1.734375, "learning_rate": 1.3950000000000002e-05, "loss": 1.3852, "step": 280 }, { "contrastive_loss": 5.4619140625, "epoch": 0.03319502074688797, "mse_loss": 0.2666993737220764, "step": 280 }, { "epoch": 0.03438055720213397, "grad_norm": 3.203125, "learning_rate": 1.4449999999999999e-05, "loss": 1.368, "step": 290 }, { "contrastive_loss": 5.459228515625, "epoch": 0.03438055720213397, "mse_loss": 0.30442720651626587, "step": 290 }, { "epoch": 0.03556609365737996, "grad_norm": 2.203125, "learning_rate": 1.4950000000000001e-05, "loss": 1.3462, "step": 300 }, { "contrastive_loss": 5.344482421875, "epoch": 0.03556609365737996, "mse_loss": 0.35500937700271606, "step": 300 }, { "epoch": 0.036751630112625965, "grad_norm": 1.421875, "learning_rate": 1.545e-05, "loss": 1.3515, "step": 310 }, { "contrastive_loss": 5.41064453125, "epoch": 0.036751630112625965, "mse_loss": 0.23119105398654938, "step": 310 }, { "epoch": 0.03793716656787196, "grad_norm": 2.234375, "learning_rate": 1.595e-05, "loss": 1.3092, "step": 320 }, { "contrastive_loss": 5.346923828125, "epoch": 0.03793716656787196, "mse_loss": 0.2441517412662506, "step": 320 }, { "epoch": 0.03912270302311796, "grad_norm": 1.6015625, "learning_rate": 1.645e-05, "loss": 1.3165, "step": 330 }, { "contrastive_loss": 5.1787109375, "epoch": 0.03912270302311796, "mse_loss": 0.2166583091020584, "step": 330 }, { "epoch": 0.04030823947836396, "grad_norm": 1.375, "learning_rate": 1.6950000000000002e-05, "loss": 1.2874, "step": 340 }, { "contrastive_loss": 5.24365234375, "epoch": 0.04030823947836396, "mse_loss": 0.24041740596294403, "step": 340 }, { "epoch": 0.04149377593360996, "grad_norm": 1.84375, "learning_rate": 1.745e-05, "loss": 1.2735, "step": 350 }, { "contrastive_loss": 5.25732421875, "epoch": 0.04149377593360996, "mse_loss": 0.2684544026851654, "step": 350 }, { "epoch": 0.04267931238885596, "grad_norm": 1.484375, "learning_rate": 1.795e-05, "loss": 1.2573, "step": 360 }, { "contrastive_loss": 5.097900390625, "epoch": 0.04267931238885596, "mse_loss": 0.26131823658943176, "step": 360 }, { "epoch": 0.04386484884410195, "grad_norm": 2.8125, "learning_rate": 1.845e-05, "loss": 1.2507, "step": 370 }, { "contrastive_loss": 5.31591796875, "epoch": 0.04386484884410195, "mse_loss": 0.22671115398406982, "step": 370 }, { "epoch": 0.045050385299347954, "grad_norm": 1.9140625, "learning_rate": 1.895e-05, "loss": 1.2557, "step": 380 }, { "contrastive_loss": 5.11962890625, "epoch": 0.045050385299347954, "mse_loss": 0.20279158651828766, "step": 380 }, { "epoch": 0.046235921754593956, "grad_norm": 1.359375, "learning_rate": 1.9450000000000002e-05, "loss": 1.2441, "step": 390 }, { "contrastive_loss": 5.0191650390625, "epoch": 0.046235921754593956, "mse_loss": 0.20302759110927582, "step": 390 }, { "epoch": 0.04742145820983995, "grad_norm": 2.265625, "learning_rate": 1.995e-05, "loss": 1.2388, "step": 400 }, { "contrastive_loss": 4.939208984375, "epoch": 0.04742145820983995, "mse_loss": 0.18910615146160126, "step": 400 }, { "epoch": 0.04860699466508595, "grad_norm": 1.6484375, "learning_rate": 2.045e-05, "loss": 1.2331, "step": 410 }, { "contrastive_loss": 5.063232421875, "epoch": 0.04860699466508595, "mse_loss": 0.23153099417686462, "step": 410 }, { "epoch": 0.04979253112033195, "grad_norm": 2.546875, "learning_rate": 2.095e-05, "loss": 1.2223, "step": 420 }, { "contrastive_loss": 4.89599609375, "epoch": 0.04979253112033195, "mse_loss": 0.1945224553346634, "step": 420 }, { "epoch": 0.05097806757557795, "grad_norm": 1.6484375, "learning_rate": 2.145e-05, "loss": 1.2015, "step": 430 }, { "contrastive_loss": 4.9874267578125, "epoch": 0.05097806757557795, "mse_loss": 0.21720878779888153, "step": 430 }, { "epoch": 0.05216360403082395, "grad_norm": 3.5625, "learning_rate": 2.195e-05, "loss": 1.2165, "step": 440 }, { "contrastive_loss": 4.961669921875, "epoch": 0.05216360403082395, "mse_loss": 0.19037406146526337, "step": 440 }, { "epoch": 0.053349140486069944, "grad_norm": 1.5078125, "learning_rate": 2.245e-05, "loss": 1.1949, "step": 450 }, { "contrastive_loss": 5.04443359375, "epoch": 0.053349140486069944, "mse_loss": 0.2131185680627823, "step": 450 }, { "epoch": 0.054534676941315946, "grad_norm": 2.359375, "learning_rate": 2.2950000000000002e-05, "loss": 1.2021, "step": 460 }, { "contrastive_loss": 4.8563232421875, "epoch": 0.054534676941315946, "mse_loss": 0.24933679401874542, "step": 460 }, { "epoch": 0.05572021339656195, "grad_norm": 1.328125, "learning_rate": 2.345e-05, "loss": 1.1901, "step": 470 }, { "contrastive_loss": 4.9130859375, "epoch": 0.05572021339656195, "mse_loss": 0.2124623954296112, "step": 470 }, { "epoch": 0.05690574985180794, "grad_norm": 1.9296875, "learning_rate": 2.395e-05, "loss": 1.1849, "step": 480 }, { "contrastive_loss": 4.7525634765625, "epoch": 0.05690574985180794, "mse_loss": 0.20945003628730774, "step": 480 }, { "epoch": 0.058091286307053944, "grad_norm": 2.25, "learning_rate": 2.445e-05, "loss": 1.1672, "step": 490 }, { "contrastive_loss": 4.781494140625, "epoch": 0.058091286307053944, "mse_loss": 0.18707378208637238, "step": 490 }, { "epoch": 0.05927682276229994, "grad_norm": 1.6484375, "learning_rate": 2.495e-05, "loss": 1.1761, "step": 500 }, { "contrastive_loss": 4.911865234375, "epoch": 0.05927682276229994, "mse_loss": 0.2479414939880371, "step": 500 }, { "epoch": 0.06046235921754594, "grad_norm": 2.453125, "learning_rate": 2.5450000000000002e-05, "loss": 1.1713, "step": 510 }, { "contrastive_loss": 4.930908203125, "epoch": 0.06046235921754594, "mse_loss": 0.1973489671945572, "step": 510 }, { "epoch": 0.06164789567279194, "grad_norm": 1.828125, "learning_rate": 2.595e-05, "loss": 1.1707, "step": 520 }, { "contrastive_loss": 4.7442626953125, "epoch": 0.06164789567279194, "mse_loss": 0.17603302001953125, "step": 520 }, { "epoch": 0.06283343212803794, "grad_norm": 1.9765625, "learning_rate": 2.6450000000000003e-05, "loss": 1.169, "step": 530 }, { "contrastive_loss": 4.9310302734375, "epoch": 0.06283343212803794, "mse_loss": 0.17854173481464386, "step": 530 }, { "epoch": 0.06401896858328393, "grad_norm": 1.453125, "learning_rate": 2.6950000000000005e-05, "loss": 1.1427, "step": 540 }, { "contrastive_loss": 4.9222412109375, "epoch": 0.06401896858328393, "mse_loss": 0.16019365191459656, "step": 540 }, { "epoch": 0.06520450503852994, "grad_norm": 2.5, "learning_rate": 2.7450000000000003e-05, "loss": 1.1558, "step": 550 }, { "contrastive_loss": 4.8341064453125, "epoch": 0.06520450503852994, "mse_loss": 0.1831035614013672, "step": 550 }, { "epoch": 0.06639004149377593, "grad_norm": 1.5234375, "learning_rate": 2.7950000000000005e-05, "loss": 1.1147, "step": 560 }, { "contrastive_loss": 4.730712890625, "epoch": 0.06639004149377593, "mse_loss": 0.17598488926887512, "step": 560 }, { "epoch": 0.06757557794902193, "grad_norm": 1.4921875, "learning_rate": 2.845e-05, "loss": 1.126, "step": 570 }, { "contrastive_loss": 4.8433837890625, "epoch": 0.06757557794902193, "mse_loss": 0.18251855671405792, "step": 570 }, { "epoch": 0.06876111440426794, "grad_norm": 1.796875, "learning_rate": 2.895e-05, "loss": 1.1258, "step": 580 }, { "contrastive_loss": 4.629150390625, "epoch": 0.06876111440426794, "mse_loss": 0.19276496767997742, "step": 580 }, { "epoch": 0.06994665085951393, "grad_norm": 1.625, "learning_rate": 2.945e-05, "loss": 1.134, "step": 590 }, { "contrastive_loss": 4.72900390625, "epoch": 0.06994665085951393, "mse_loss": 0.19505956768989563, "step": 590 }, { "epoch": 0.07113218731475993, "grad_norm": 1.5546875, "learning_rate": 2.995e-05, "loss": 1.1304, "step": 600 }, { "contrastive_loss": 4.69140625, "epoch": 0.07113218731475993, "mse_loss": 0.19534291326999664, "step": 600 }, { "epoch": 0.07231772377000593, "grad_norm": 1.3515625, "learning_rate": 3.045e-05, "loss": 1.1254, "step": 610 }, { "contrastive_loss": 4.65576171875, "epoch": 0.07231772377000593, "mse_loss": 0.18933293223381042, "step": 610 }, { "epoch": 0.07350326022525193, "grad_norm": 1.9765625, "learning_rate": 3.095e-05, "loss": 1.1247, "step": 620 }, { "contrastive_loss": 4.776123046875, "epoch": 0.07350326022525193, "mse_loss": 0.18707619607448578, "step": 620 }, { "epoch": 0.07468879668049792, "grad_norm": 1.4296875, "learning_rate": 3.145e-05, "loss": 1.1107, "step": 630 }, { "contrastive_loss": 4.71923828125, "epoch": 0.07468879668049792, "mse_loss": 0.14242276549339294, "step": 630 }, { "epoch": 0.07587433313574392, "grad_norm": 1.40625, "learning_rate": 3.1950000000000004e-05, "loss": 1.1114, "step": 640 }, { "contrastive_loss": 4.6484375, "epoch": 0.07587433313574392, "mse_loss": 0.19214288890361786, "step": 640 }, { "epoch": 0.07705986959098993, "grad_norm": 1.859375, "learning_rate": 3.245e-05, "loss": 1.1215, "step": 650 }, { "contrastive_loss": 4.611328125, "epoch": 0.07705986959098993, "mse_loss": 0.1549609899520874, "step": 650 }, { "epoch": 0.07824540604623592, "grad_norm": 2.453125, "learning_rate": 3.295e-05, "loss": 1.1034, "step": 660 }, { "contrastive_loss": 4.6693115234375, "epoch": 0.07824540604623592, "mse_loss": 0.15536080300807953, "step": 660 }, { "epoch": 0.07943094250148192, "grad_norm": 2.09375, "learning_rate": 3.345000000000001e-05, "loss": 1.1208, "step": 670 }, { "contrastive_loss": 4.57470703125, "epoch": 0.07943094250148192, "mse_loss": 0.17876751720905304, "step": 670 }, { "epoch": 0.08061647895672792, "grad_norm": 3.625, "learning_rate": 3.3950000000000005e-05, "loss": 1.1036, "step": 680 }, { "contrastive_loss": 4.4874267578125, "epoch": 0.08061647895672792, "mse_loss": 0.18046358227729797, "step": 680 }, { "epoch": 0.08180201541197392, "grad_norm": 1.5859375, "learning_rate": 3.445e-05, "loss": 1.1089, "step": 690 }, { "contrastive_loss": 4.650146484375, "epoch": 0.08180201541197392, "mse_loss": 0.1482270509004593, "step": 690 }, { "epoch": 0.08298755186721991, "grad_norm": 1.421875, "learning_rate": 3.495e-05, "loss": 1.0869, "step": 700 }, { "contrastive_loss": 4.6461181640625, "epoch": 0.08298755186721991, "mse_loss": 0.15026690065860748, "step": 700 }, { "epoch": 0.08417308832246592, "grad_norm": 1.5390625, "learning_rate": 3.545e-05, "loss": 1.1057, "step": 710 }, { "contrastive_loss": 4.609619140625, "epoch": 0.08417308832246592, "mse_loss": 0.17840172350406647, "step": 710 }, { "epoch": 0.08535862477771192, "grad_norm": 1.4453125, "learning_rate": 3.595e-05, "loss": 1.0833, "step": 720 }, { "contrastive_loss": 4.51708984375, "epoch": 0.08535862477771192, "mse_loss": 0.20048737525939941, "step": 720 }, { "epoch": 0.08654416123295791, "grad_norm": 2.4375, "learning_rate": 3.645e-05, "loss": 1.0877, "step": 730 }, { "contrastive_loss": 4.65966796875, "epoch": 0.08654416123295791, "mse_loss": 0.13850751519203186, "step": 730 }, { "epoch": 0.0877296976882039, "grad_norm": 1.953125, "learning_rate": 3.6950000000000004e-05, "loss": 1.0729, "step": 740 }, { "contrastive_loss": 4.5433349609375, "epoch": 0.0877296976882039, "mse_loss": 0.12611888349056244, "step": 740 }, { "epoch": 0.08891523414344991, "grad_norm": 1.5859375, "learning_rate": 3.745e-05, "loss": 1.0725, "step": 750 }, { "contrastive_loss": 4.646728515625, "epoch": 0.08891523414344991, "mse_loss": 0.1584591418504715, "step": 750 }, { "epoch": 0.09010077059869591, "grad_norm": 1.4921875, "learning_rate": 3.795e-05, "loss": 1.0698, "step": 760 }, { "contrastive_loss": 4.52783203125, "epoch": 0.09010077059869591, "mse_loss": 0.13924750685691833, "step": 760 }, { "epoch": 0.0912863070539419, "grad_norm": 1.5859375, "learning_rate": 3.845e-05, "loss": 1.0589, "step": 770 }, { "contrastive_loss": 4.6591796875, "epoch": 0.0912863070539419, "mse_loss": 0.14962004125118256, "step": 770 }, { "epoch": 0.09247184350918791, "grad_norm": 2.265625, "learning_rate": 3.8950000000000005e-05, "loss": 1.0862, "step": 780 }, { "contrastive_loss": 4.6407470703125, "epoch": 0.09247184350918791, "mse_loss": 0.1839859038591385, "step": 780 }, { "epoch": 0.0936573799644339, "grad_norm": 1.7578125, "learning_rate": 3.9450000000000003e-05, "loss": 1.0844, "step": 790 }, { "contrastive_loss": 4.6689453125, "epoch": 0.0936573799644339, "mse_loss": 0.13388986885547638, "step": 790 }, { "epoch": 0.0948429164196799, "grad_norm": 1.984375, "learning_rate": 3.995e-05, "loss": 1.053, "step": 800 }, { "contrastive_loss": 4.535400390625, "epoch": 0.0948429164196799, "mse_loss": 0.1562316119670868, "step": 800 }, { "epoch": 0.09602845287492591, "grad_norm": 1.078125, "learning_rate": 4.045000000000001e-05, "loss": 1.0654, "step": 810 }, { "contrastive_loss": 4.5404052734375, "epoch": 0.09602845287492591, "mse_loss": 0.12796232104301453, "step": 810 }, { "epoch": 0.0972139893301719, "grad_norm": 1.75, "learning_rate": 4.095e-05, "loss": 1.0653, "step": 820 }, { "contrastive_loss": 4.650390625, "epoch": 0.0972139893301719, "mse_loss": 0.13285325467586517, "step": 820 }, { "epoch": 0.0983995257854179, "grad_norm": 1.6015625, "learning_rate": 4.145e-05, "loss": 1.0645, "step": 830 }, { "contrastive_loss": 4.5380859375, "epoch": 0.0983995257854179, "mse_loss": 0.15655764937400818, "step": 830 }, { "epoch": 0.0995850622406639, "grad_norm": 1.3671875, "learning_rate": 4.195e-05, "loss": 1.0388, "step": 840 }, { "contrastive_loss": 4.5191650390625, "epoch": 0.0995850622406639, "mse_loss": 0.14153768122196198, "step": 840 }, { "epoch": 0.1007705986959099, "grad_norm": 1.7734375, "learning_rate": 4.245e-05, "loss": 1.0851, "step": 850 }, { "contrastive_loss": 4.5848388671875, "epoch": 0.1007705986959099, "mse_loss": 0.13734504580497742, "step": 850 }, { "epoch": 0.1019561351511559, "grad_norm": 1.453125, "learning_rate": 4.295e-05, "loss": 1.0616, "step": 860 }, { "contrastive_loss": 4.4615478515625, "epoch": 0.1019561351511559, "mse_loss": 0.10722164809703827, "step": 860 }, { "epoch": 0.10314167160640189, "grad_norm": 1.40625, "learning_rate": 4.345e-05, "loss": 1.0505, "step": 870 }, { "contrastive_loss": 4.420166015625, "epoch": 0.10314167160640189, "mse_loss": 0.13786707818508148, "step": 870 }, { "epoch": 0.1043272080616479, "grad_norm": 1.46875, "learning_rate": 4.3950000000000004e-05, "loss": 1.0403, "step": 880 }, { "contrastive_loss": 4.5147705078125, "epoch": 0.1043272080616479, "mse_loss": 0.14357486367225647, "step": 880 }, { "epoch": 0.1055127445168939, "grad_norm": 1.5546875, "learning_rate": 4.445e-05, "loss": 1.0386, "step": 890 }, { "contrastive_loss": 4.4693603515625, "epoch": 0.1055127445168939, "mse_loss": 0.12314682453870773, "step": 890 }, { "epoch": 0.10669828097213989, "grad_norm": 1.3671875, "learning_rate": 4.495e-05, "loss": 1.0469, "step": 900 }, { "contrastive_loss": 4.501220703125, "epoch": 0.10669828097213989, "mse_loss": 0.17460396885871887, "step": 900 }, { "epoch": 0.1078838174273859, "grad_norm": 1.6171875, "learning_rate": 4.545000000000001e-05, "loss": 1.0425, "step": 910 }, { "contrastive_loss": 4.567138671875, "epoch": 0.1078838174273859, "mse_loss": 0.13012012839317322, "step": 910 }, { "epoch": 0.10906935388263189, "grad_norm": 1.3828125, "learning_rate": 4.5950000000000006e-05, "loss": 1.0329, "step": 920 }, { "contrastive_loss": 4.646240234375, "epoch": 0.10906935388263189, "mse_loss": 0.1588732749223709, "step": 920 }, { "epoch": 0.11025489033787789, "grad_norm": 1.515625, "learning_rate": 4.6450000000000004e-05, "loss": 1.0411, "step": 930 }, { "contrastive_loss": 4.551513671875, "epoch": 0.11025489033787789, "mse_loss": 0.12044618278741837, "step": 930 }, { "epoch": 0.1114404267931239, "grad_norm": 2.78125, "learning_rate": 4.695e-05, "loss": 1.0341, "step": 940 }, { "contrastive_loss": 4.5450439453125, "epoch": 0.1114404267931239, "mse_loss": 0.17043618857860565, "step": 940 }, { "epoch": 0.11262596324836989, "grad_norm": 1.671875, "learning_rate": 4.745e-05, "loss": 1.0471, "step": 950 }, { "contrastive_loss": 4.4482421875, "epoch": 0.11262596324836989, "mse_loss": 0.19017429649829865, "step": 950 }, { "epoch": 0.11381149970361588, "grad_norm": 1.1171875, "learning_rate": 4.795e-05, "loss": 1.0383, "step": 960 }, { "contrastive_loss": 4.566162109375, "epoch": 0.11381149970361588, "mse_loss": 0.19182585179805756, "step": 960 }, { "epoch": 0.11499703615886188, "grad_norm": 1.21875, "learning_rate": 4.845e-05, "loss": 1.0264, "step": 970 }, { "contrastive_loss": 4.41259765625, "epoch": 0.11499703615886188, "mse_loss": 0.1645308881998062, "step": 970 }, { "epoch": 0.11618257261410789, "grad_norm": 1.6171875, "learning_rate": 4.8950000000000004e-05, "loss": 1.0349, "step": 980 }, { "contrastive_loss": 4.3712158203125, "epoch": 0.11618257261410789, "mse_loss": 0.13010339438915253, "step": 980 }, { "epoch": 0.11736810906935388, "grad_norm": 1.265625, "learning_rate": 4.945e-05, "loss": 1.0253, "step": 990 }, { "contrastive_loss": 4.4615478515625, "epoch": 0.11736810906935388, "mse_loss": 0.12058433145284653, "step": 990 }, { "epoch": 0.11855364552459988, "grad_norm": 1.3203125, "learning_rate": 4.995e-05, "loss": 1.0183, "step": 1000 }, { "contrastive_loss": 4.324462890625, "epoch": 0.11855364552459988, "mse_loss": 0.13803984224796295, "step": 1000 }, { "epoch": 0.11973918197984589, "grad_norm": 1.2734375, "learning_rate": 5.045e-05, "loss": 1.0162, "step": 1010 }, { "contrastive_loss": 4.4793701171875, "epoch": 0.11973918197984589, "mse_loss": 0.14454035460948944, "step": 1010 }, { "epoch": 0.12092471843509188, "grad_norm": 1.2890625, "learning_rate": 5.095e-05, "loss": 1.0262, "step": 1020 }, { "contrastive_loss": 4.491943359375, "epoch": 0.12092471843509188, "mse_loss": 0.16094525158405304, "step": 1020 }, { "epoch": 0.12211025489033787, "grad_norm": 1.53125, "learning_rate": 5.145e-05, "loss": 1.0188, "step": 1030 }, { "contrastive_loss": 4.38330078125, "epoch": 0.12211025489033787, "mse_loss": 0.1571045219898224, "step": 1030 }, { "epoch": 0.12329579134558388, "grad_norm": 1.546875, "learning_rate": 5.1949999999999996e-05, "loss": 1.0246, "step": 1040 }, { "contrastive_loss": 4.4735107421875, "epoch": 0.12329579134558388, "mse_loss": 0.11645889282226562, "step": 1040 }, { "epoch": 0.12448132780082988, "grad_norm": 1.2109375, "learning_rate": 5.245e-05, "loss": 1.012, "step": 1050 }, { "contrastive_loss": 4.4150390625, "epoch": 0.12448132780082988, "mse_loss": 0.12138732522726059, "step": 1050 }, { "epoch": 0.12566686425607587, "grad_norm": 1.578125, "learning_rate": 5.295e-05, "loss": 1.0217, "step": 1060 }, { "contrastive_loss": 4.557373046875, "epoch": 0.12566686425607587, "mse_loss": 0.14879122376441956, "step": 1060 }, { "epoch": 0.12685240071132187, "grad_norm": 1.390625, "learning_rate": 5.345e-05, "loss": 1.0272, "step": 1070 }, { "contrastive_loss": 4.345947265625, "epoch": 0.12685240071132187, "mse_loss": 0.16460701823234558, "step": 1070 }, { "epoch": 0.12803793716656786, "grad_norm": 1.6328125, "learning_rate": 5.3950000000000004e-05, "loss": 1.0155, "step": 1080 }, { "contrastive_loss": 4.2982177734375, "epoch": 0.12803793716656786, "mse_loss": 0.12065846472978592, "step": 1080 }, { "epoch": 0.12922347362181388, "grad_norm": 1.65625, "learning_rate": 5.445e-05, "loss": 1.0021, "step": 1090 }, { "contrastive_loss": 4.3848876953125, "epoch": 0.12922347362181388, "mse_loss": 0.14166076481342316, "step": 1090 }, { "epoch": 0.13040901007705988, "grad_norm": 1.7734375, "learning_rate": 5.495e-05, "loss": 1.015, "step": 1100 }, { "contrastive_loss": 4.4365234375, "epoch": 0.13040901007705988, "mse_loss": 0.11627322435379028, "step": 1100 }, { "epoch": 0.13159454653230587, "grad_norm": 1.4140625, "learning_rate": 5.545e-05, "loss": 1.008, "step": 1110 }, { "contrastive_loss": 4.39111328125, "epoch": 0.13159454653230587, "mse_loss": 0.14318551123142242, "step": 1110 }, { "epoch": 0.13278008298755187, "grad_norm": 1.140625, "learning_rate": 5.5950000000000005e-05, "loss": 1.0092, "step": 1120 }, { "contrastive_loss": 4.4024658203125, "epoch": 0.13278008298755187, "mse_loss": 0.13138417899608612, "step": 1120 }, { "epoch": 0.13396561944279786, "grad_norm": 1.03125, "learning_rate": 5.645e-05, "loss": 1.0052, "step": 1130 }, { "contrastive_loss": 4.467529296875, "epoch": 0.13396561944279786, "mse_loss": 0.12093173712491989, "step": 1130 }, { "epoch": 0.13515115589804386, "grad_norm": 1.4296875, "learning_rate": 5.695e-05, "loss": 1.0211, "step": 1140 }, { "contrastive_loss": 4.27685546875, "epoch": 0.13515115589804386, "mse_loss": 0.12921595573425293, "step": 1140 }, { "epoch": 0.13633669235328985, "grad_norm": 1.328125, "learning_rate": 5.745e-05, "loss": 1.0118, "step": 1150 }, { "contrastive_loss": 4.3140869140625, "epoch": 0.13633669235328985, "mse_loss": 0.10838256031274796, "step": 1150 }, { "epoch": 0.13752222880853587, "grad_norm": 1.4140625, "learning_rate": 5.7950000000000006e-05, "loss": 0.9958, "step": 1160 }, { "contrastive_loss": 4.2861328125, "epoch": 0.13752222880853587, "mse_loss": 0.139155775308609, "step": 1160 }, { "epoch": 0.13870776526378187, "grad_norm": 1.2578125, "learning_rate": 5.8450000000000005e-05, "loss": 1.007, "step": 1170 }, { "contrastive_loss": 4.5589599609375, "epoch": 0.13870776526378187, "mse_loss": 0.13191832602024078, "step": 1170 }, { "epoch": 0.13989330171902786, "grad_norm": 1.5390625, "learning_rate": 5.895e-05, "loss": 0.9922, "step": 1180 }, { "contrastive_loss": 4.3570556640625, "epoch": 0.13989330171902786, "mse_loss": 0.08645403385162354, "step": 1180 }, { "epoch": 0.14107883817427386, "grad_norm": 1.96875, "learning_rate": 5.945000000000001e-05, "loss": 0.9884, "step": 1190 }, { "contrastive_loss": 4.393798828125, "epoch": 0.14107883817427386, "mse_loss": 0.12360095977783203, "step": 1190 }, { "epoch": 0.14226437462951985, "grad_norm": 1.453125, "learning_rate": 5.995000000000001e-05, "loss": 1.0007, "step": 1200 }, { "contrastive_loss": 4.39306640625, "epoch": 0.14226437462951985, "mse_loss": 0.13033276796340942, "step": 1200 }, { "epoch": 0.14344991108476585, "grad_norm": 1.5390625, "learning_rate": 6.0450000000000006e-05, "loss": 0.9934, "step": 1210 }, { "contrastive_loss": 4.3907470703125, "epoch": 0.14344991108476585, "mse_loss": 0.15238641202449799, "step": 1210 }, { "epoch": 0.14463544754001187, "grad_norm": 1.03125, "learning_rate": 6.0950000000000004e-05, "loss": 1.0015, "step": 1220 }, { "contrastive_loss": 4.44775390625, "epoch": 0.14463544754001187, "mse_loss": 0.13099659979343414, "step": 1220 }, { "epoch": 0.14582098399525786, "grad_norm": 1.2734375, "learning_rate": 6.145e-05, "loss": 1.0, "step": 1230 }, { "contrastive_loss": 4.3974609375, "epoch": 0.14582098399525786, "mse_loss": 0.15997307002544403, "step": 1230 }, { "epoch": 0.14700652045050386, "grad_norm": 1.5390625, "learning_rate": 6.195e-05, "loss": 0.9853, "step": 1240 }, { "contrastive_loss": 4.5220947265625, "epoch": 0.14700652045050386, "mse_loss": 0.15793175995349884, "step": 1240 }, { "epoch": 0.14819205690574985, "grad_norm": 1.2890625, "learning_rate": 6.245000000000001e-05, "loss": 1.0128, "step": 1250 }, { "contrastive_loss": 4.3785400390625, "epoch": 0.14819205690574985, "mse_loss": 0.12808099389076233, "step": 1250 }, { "epoch": 0.14937759336099585, "grad_norm": 1.109375, "learning_rate": 6.295e-05, "loss": 0.9938, "step": 1260 }, { "contrastive_loss": 4.2698974609375, "epoch": 0.14937759336099585, "mse_loss": 0.1473233997821808, "step": 1260 }, { "epoch": 0.15056312981624184, "grad_norm": 0.984375, "learning_rate": 6.345e-05, "loss": 1.0049, "step": 1270 }, { "contrastive_loss": 4.28076171875, "epoch": 0.15056312981624184, "mse_loss": 0.09115008264780045, "step": 1270 }, { "epoch": 0.15174866627148784, "grad_norm": 1.234375, "learning_rate": 6.395e-05, "loss": 0.9927, "step": 1280 }, { "contrastive_loss": 4.3397216796875, "epoch": 0.15174866627148784, "mse_loss": 0.13002793490886688, "step": 1280 }, { "epoch": 0.15293420272673386, "grad_norm": 1.125, "learning_rate": 6.445e-05, "loss": 0.9962, "step": 1290 }, { "contrastive_loss": 4.335693359375, "epoch": 0.15293420272673386, "mse_loss": 0.11734514683485031, "step": 1290 }, { "epoch": 0.15411973918197985, "grad_norm": 1.0703125, "learning_rate": 6.494999999999999e-05, "loss": 0.9856, "step": 1300 }, { "contrastive_loss": 4.3775634765625, "epoch": 0.15411973918197985, "mse_loss": 0.07884640991687775, "step": 1300 }, { "epoch": 0.15530527563722585, "grad_norm": 1.2421875, "learning_rate": 6.545e-05, "loss": 0.9904, "step": 1310 }, { "contrastive_loss": 4.216064453125, "epoch": 0.15530527563722585, "mse_loss": 0.17731989920139313, "step": 1310 }, { "epoch": 0.15649081209247184, "grad_norm": 0.90234375, "learning_rate": 6.595e-05, "loss": 0.9813, "step": 1320 }, { "contrastive_loss": 4.228271484375, "epoch": 0.15649081209247184, "mse_loss": 0.17569664120674133, "step": 1320 }, { "epoch": 0.15767634854771784, "grad_norm": 1.2109375, "learning_rate": 6.645e-05, "loss": 0.9818, "step": 1330 }, { "contrastive_loss": 4.1724853515625, "epoch": 0.15767634854771784, "mse_loss": 0.12328781187534332, "step": 1330 }, { "epoch": 0.15886188500296383, "grad_norm": 1.2421875, "learning_rate": 6.695e-05, "loss": 0.9906, "step": 1340 }, { "contrastive_loss": 4.5040283203125, "epoch": 0.15886188500296383, "mse_loss": 0.11902057379484177, "step": 1340 }, { "epoch": 0.16004742145820983, "grad_norm": 1.234375, "learning_rate": 6.745e-05, "loss": 0.9872, "step": 1350 }, { "contrastive_loss": 4.228271484375, "epoch": 0.16004742145820983, "mse_loss": 0.09324859082698822, "step": 1350 }, { "epoch": 0.16123295791345585, "grad_norm": 1.5234375, "learning_rate": 6.795e-05, "loss": 0.9807, "step": 1360 }, { "contrastive_loss": 4.209228515625, "epoch": 0.16123295791345585, "mse_loss": 0.12618182599544525, "step": 1360 }, { "epoch": 0.16241849436870184, "grad_norm": 1.0859375, "learning_rate": 6.845e-05, "loss": 0.9584, "step": 1370 }, { "contrastive_loss": 4.3067626953125, "epoch": 0.16241849436870184, "mse_loss": 0.11295019835233688, "step": 1370 }, { "epoch": 0.16360403082394784, "grad_norm": 1.1328125, "learning_rate": 6.895000000000001e-05, "loss": 0.9796, "step": 1380 }, { "contrastive_loss": 4.3511962890625, "epoch": 0.16360403082394784, "mse_loss": 0.12488330155611038, "step": 1380 }, { "epoch": 0.16478956727919383, "grad_norm": 1.0546875, "learning_rate": 6.945000000000001e-05, "loss": 0.9667, "step": 1390 }, { "contrastive_loss": 4.2166748046875, "epoch": 0.16478956727919383, "mse_loss": 0.12394828349351883, "step": 1390 }, { "epoch": 0.16597510373443983, "grad_norm": 1.03125, "learning_rate": 6.995e-05, "loss": 0.992, "step": 1400 }, { "contrastive_loss": 4.2176513671875, "epoch": 0.16597510373443983, "mse_loss": 0.12171681970357895, "step": 1400 }, { "epoch": 0.16716064018968582, "grad_norm": 1.0546875, "learning_rate": 7.045e-05, "loss": 0.9517, "step": 1410 }, { "contrastive_loss": 4.3387451171875, "epoch": 0.16716064018968582, "mse_loss": 0.10624518245458603, "step": 1410 }, { "epoch": 0.16834617664493184, "grad_norm": 1.15625, "learning_rate": 7.095e-05, "loss": 0.9805, "step": 1420 }, { "contrastive_loss": 4.3096923828125, "epoch": 0.16834617664493184, "mse_loss": 0.10782011598348618, "step": 1420 }, { "epoch": 0.16953171310017784, "grad_norm": 1.0546875, "learning_rate": 7.145e-05, "loss": 0.9783, "step": 1430 }, { "contrastive_loss": 4.1890869140625, "epoch": 0.16953171310017784, "mse_loss": 0.13114988803863525, "step": 1430 }, { "epoch": 0.17071724955542383, "grad_norm": 1.0, "learning_rate": 7.195e-05, "loss": 0.9799, "step": 1440 }, { "contrastive_loss": 4.235107421875, "epoch": 0.17071724955542383, "mse_loss": 0.07127879559993744, "step": 1440 }, { "epoch": 0.17190278601066983, "grad_norm": 1.15625, "learning_rate": 7.245000000000001e-05, "loss": 0.9743, "step": 1450 }, { "contrastive_loss": 4.1944580078125, "epoch": 0.17190278601066983, "mse_loss": 0.11541880667209625, "step": 1450 }, { "epoch": 0.17308832246591582, "grad_norm": 1.1640625, "learning_rate": 7.295000000000001e-05, "loss": 0.9775, "step": 1460 }, { "contrastive_loss": 4.407470703125, "epoch": 0.17308832246591582, "mse_loss": 0.12938758730888367, "step": 1460 }, { "epoch": 0.17427385892116182, "grad_norm": 0.96484375, "learning_rate": 7.345000000000001e-05, "loss": 0.9874, "step": 1470 }, { "contrastive_loss": 4.322509765625, "epoch": 0.17427385892116182, "mse_loss": 0.14528608322143555, "step": 1470 }, { "epoch": 0.1754593953764078, "grad_norm": 2.75, "learning_rate": 7.395000000000001e-05, "loss": 0.9897, "step": 1480 }, { "contrastive_loss": 4.2852783203125, "epoch": 0.1754593953764078, "mse_loss": 0.12063200026750565, "step": 1480 }, { "epoch": 0.17664493183165383, "grad_norm": 1.1796875, "learning_rate": 7.445000000000001e-05, "loss": 0.9802, "step": 1490 }, { "contrastive_loss": 4.32177734375, "epoch": 0.17664493183165383, "mse_loss": 0.11678945273160934, "step": 1490 }, { "epoch": 0.17783046828689983, "grad_norm": 1.1171875, "learning_rate": 7.495e-05, "loss": 0.9998, "step": 1500 }, { "contrastive_loss": 4.2510986328125, "epoch": 0.17783046828689983, "mse_loss": 0.14115972816944122, "step": 1500 }, { "epoch": 0.17901600474214582, "grad_norm": 0.90234375, "learning_rate": 7.545e-05, "loss": 0.9817, "step": 1510 }, { "contrastive_loss": 4.202880859375, "epoch": 0.17901600474214582, "mse_loss": 0.13399504125118256, "step": 1510 }, { "epoch": 0.18020154119739182, "grad_norm": 1.5, "learning_rate": 7.595e-05, "loss": 0.9796, "step": 1520 }, { "contrastive_loss": 4.3336181640625, "epoch": 0.18020154119739182, "mse_loss": 0.13779492676258087, "step": 1520 }, { "epoch": 0.1813870776526378, "grad_norm": 1.1171875, "learning_rate": 7.645e-05, "loss": 0.981, "step": 1530 }, { "contrastive_loss": 4.1884765625, "epoch": 0.1813870776526378, "mse_loss": 0.10163839906454086, "step": 1530 }, { "epoch": 0.1825726141078838, "grad_norm": 1.109375, "learning_rate": 7.695e-05, "loss": 0.9799, "step": 1540 }, { "contrastive_loss": 4.096435546875, "epoch": 0.1825726141078838, "mse_loss": 0.1465039700269699, "step": 1540 }, { "epoch": 0.18375815056312983, "grad_norm": 1.1328125, "learning_rate": 7.745e-05, "loss": 0.9826, "step": 1550 }, { "contrastive_loss": 4.25390625, "epoch": 0.18375815056312983, "mse_loss": 0.10464929044246674, "step": 1550 }, { "epoch": 0.18494368701837582, "grad_norm": 1.2109375, "learning_rate": 7.795e-05, "loss": 0.9722, "step": 1560 }, { "contrastive_loss": 4.3299560546875, "epoch": 0.18494368701837582, "mse_loss": 0.12820297479629517, "step": 1560 }, { "epoch": 0.18612922347362182, "grad_norm": 1.0703125, "learning_rate": 7.845e-05, "loss": 0.9514, "step": 1570 }, { "contrastive_loss": 4.291015625, "epoch": 0.18612922347362182, "mse_loss": 0.12890414893627167, "step": 1570 }, { "epoch": 0.1873147599288678, "grad_norm": 1.0859375, "learning_rate": 7.895000000000001e-05, "loss": 0.9605, "step": 1580 }, { "contrastive_loss": 4.3599853515625, "epoch": 0.1873147599288678, "mse_loss": 0.14261029660701752, "step": 1580 }, { "epoch": 0.1885002963841138, "grad_norm": 1.03125, "learning_rate": 7.945e-05, "loss": 0.9781, "step": 1590 }, { "contrastive_loss": 4.3380126953125, "epoch": 0.1885002963841138, "mse_loss": 0.10146557539701462, "step": 1590 }, { "epoch": 0.1896858328393598, "grad_norm": 0.8125, "learning_rate": 7.995e-05, "loss": 0.9659, "step": 1600 }, { "contrastive_loss": 4.135986328125, "epoch": 0.1896858328393598, "mse_loss": 0.05550520867109299, "step": 1600 }, { "epoch": 0.1908713692946058, "grad_norm": 0.89453125, "learning_rate": 8.045e-05, "loss": 0.9426, "step": 1610 }, { "contrastive_loss": 4.3958740234375, "epoch": 0.1908713692946058, "mse_loss": 0.10940030962228775, "step": 1610 }, { "epoch": 0.19205690574985182, "grad_norm": 1.1484375, "learning_rate": 8.095e-05, "loss": 0.9594, "step": 1620 }, { "contrastive_loss": 4.244384765625, "epoch": 0.19205690574985182, "mse_loss": 0.09991540014743805, "step": 1620 }, { "epoch": 0.19324244220509781, "grad_norm": 0.91796875, "learning_rate": 8.145e-05, "loss": 0.9745, "step": 1630 }, { "contrastive_loss": 4.21923828125, "epoch": 0.19324244220509781, "mse_loss": 0.13173292577266693, "step": 1630 }, { "epoch": 0.1944279786603438, "grad_norm": 0.890625, "learning_rate": 8.195e-05, "loss": 0.9661, "step": 1640 }, { "contrastive_loss": 4.265869140625, "epoch": 0.1944279786603438, "mse_loss": 0.08940328657627106, "step": 1640 }, { "epoch": 0.1956135151155898, "grad_norm": 0.890625, "learning_rate": 8.245e-05, "loss": 0.957, "step": 1650 }, { "contrastive_loss": 4.214599609375, "epoch": 0.1956135151155898, "mse_loss": 0.09421265125274658, "step": 1650 }, { "epoch": 0.1967990515708358, "grad_norm": 1.1484375, "learning_rate": 8.295000000000001e-05, "loss": 0.9614, "step": 1660 }, { "contrastive_loss": 4.3580322265625, "epoch": 0.1967990515708358, "mse_loss": 0.08690629154443741, "step": 1660 }, { "epoch": 0.1979845880260818, "grad_norm": 1.3046875, "learning_rate": 8.345000000000001e-05, "loss": 0.9566, "step": 1670 }, { "contrastive_loss": 4.2891845703125, "epoch": 0.1979845880260818, "mse_loss": 0.13481296598911285, "step": 1670 }, { "epoch": 0.1991701244813278, "grad_norm": 0.9140625, "learning_rate": 8.395000000000001e-05, "loss": 0.9579, "step": 1680 }, { "contrastive_loss": 4.2740478515625, "epoch": 0.1991701244813278, "mse_loss": 0.11066146939992905, "step": 1680 }, { "epoch": 0.2003556609365738, "grad_norm": 1.234375, "learning_rate": 8.445e-05, "loss": 0.9742, "step": 1690 }, { "contrastive_loss": 4.124267578125, "epoch": 0.2003556609365738, "mse_loss": 0.09681577235460281, "step": 1690 }, { "epoch": 0.2015411973918198, "grad_norm": 0.828125, "learning_rate": 8.495e-05, "loss": 0.9555, "step": 1700 }, { "contrastive_loss": 4.2947998046875, "epoch": 0.2015411973918198, "mse_loss": 0.0964650958776474, "step": 1700 }, { "epoch": 0.2027267338470658, "grad_norm": 0.99609375, "learning_rate": 8.545e-05, "loss": 0.9558, "step": 1710 }, { "contrastive_loss": 4.2586669921875, "epoch": 0.2027267338470658, "mse_loss": 0.1060178130865097, "step": 1710 }, { "epoch": 0.2039122703023118, "grad_norm": 0.85546875, "learning_rate": 8.595e-05, "loss": 0.9612, "step": 1720 }, { "contrastive_loss": 4.2193603515625, "epoch": 0.2039122703023118, "mse_loss": 0.14171317219734192, "step": 1720 }, { "epoch": 0.2050978067575578, "grad_norm": 0.90234375, "learning_rate": 8.645000000000001e-05, "loss": 0.9584, "step": 1730 }, { "contrastive_loss": 4.2899169921875, "epoch": 0.2050978067575578, "mse_loss": 0.09104941040277481, "step": 1730 }, { "epoch": 0.20628334321280378, "grad_norm": 1.3984375, "learning_rate": 8.695000000000001e-05, "loss": 0.9498, "step": 1740 }, { "contrastive_loss": 4.1492919921875, "epoch": 0.20628334321280378, "mse_loss": 0.12872955203056335, "step": 1740 }, { "epoch": 0.2074688796680498, "grad_norm": 1.1875, "learning_rate": 8.745000000000001e-05, "loss": 0.9487, "step": 1750 }, { "contrastive_loss": 4.263916015625, "epoch": 0.2074688796680498, "mse_loss": 0.15363569557666779, "step": 1750 }, { "epoch": 0.2086544161232958, "grad_norm": 1.28125, "learning_rate": 8.795e-05, "loss": 0.967, "step": 1760 }, { "contrastive_loss": 4.082275390625, "epoch": 0.2086544161232958, "mse_loss": 0.10705146938562393, "step": 1760 }, { "epoch": 0.2098399525785418, "grad_norm": 1.1328125, "learning_rate": 8.845e-05, "loss": 0.9471, "step": 1770 }, { "contrastive_loss": 4.22119140625, "epoch": 0.2098399525785418, "mse_loss": 0.09989335387945175, "step": 1770 }, { "epoch": 0.2110254890337878, "grad_norm": 0.7734375, "learning_rate": 8.895e-05, "loss": 0.9602, "step": 1780 }, { "contrastive_loss": 4.26025390625, "epoch": 0.2110254890337878, "mse_loss": 0.10300062596797943, "step": 1780 }, { "epoch": 0.21221102548903378, "grad_norm": 0.94140625, "learning_rate": 8.945e-05, "loss": 0.9601, "step": 1790 }, { "contrastive_loss": 4.193603515625, "epoch": 0.21221102548903378, "mse_loss": 0.09371506422758102, "step": 1790 }, { "epoch": 0.21339656194427978, "grad_norm": 1.3671875, "learning_rate": 8.995e-05, "loss": 0.9559, "step": 1800 }, { "contrastive_loss": 4.1513671875, "epoch": 0.21339656194427978, "mse_loss": 0.0837266594171524, "step": 1800 }, { "epoch": 0.21458209839952577, "grad_norm": 0.94921875, "learning_rate": 9.045e-05, "loss": 0.9564, "step": 1810 }, { "contrastive_loss": 4.2445068359375, "epoch": 0.21458209839952577, "mse_loss": 0.1212659552693367, "step": 1810 }, { "epoch": 0.2157676348547718, "grad_norm": 0.80078125, "learning_rate": 9.095e-05, "loss": 0.9381, "step": 1820 }, { "contrastive_loss": 4.17578125, "epoch": 0.2157676348547718, "mse_loss": 0.12286027520895004, "step": 1820 }, { "epoch": 0.2169531713100178, "grad_norm": 1.0625, "learning_rate": 9.145e-05, "loss": 0.9393, "step": 1830 }, { "contrastive_loss": 4.1749267578125, "epoch": 0.2169531713100178, "mse_loss": 0.1177624836564064, "step": 1830 }, { "epoch": 0.21813870776526378, "grad_norm": 0.9609375, "learning_rate": 9.195e-05, "loss": 0.9412, "step": 1840 }, { "contrastive_loss": 4.1788330078125, "epoch": 0.21813870776526378, "mse_loss": 0.14474156498908997, "step": 1840 }, { "epoch": 0.21932424422050978, "grad_norm": 0.94921875, "learning_rate": 9.245e-05, "loss": 0.9438, "step": 1850 }, { "contrastive_loss": 4.3040771484375, "epoch": 0.21932424422050978, "mse_loss": 0.09326786547899246, "step": 1850 }, { "epoch": 0.22050978067575577, "grad_norm": 1.1328125, "learning_rate": 9.295000000000001e-05, "loss": 0.9412, "step": 1860 }, { "contrastive_loss": 4.1260986328125, "epoch": 0.22050978067575577, "mse_loss": 0.12067258358001709, "step": 1860 }, { "epoch": 0.22169531713100177, "grad_norm": 1.03125, "learning_rate": 9.345000000000001e-05, "loss": 0.9484, "step": 1870 }, { "contrastive_loss": 4.18896484375, "epoch": 0.22169531713100177, "mse_loss": 0.14656202495098114, "step": 1870 }, { "epoch": 0.2228808535862478, "grad_norm": 1.1875, "learning_rate": 9.395000000000001e-05, "loss": 0.9519, "step": 1880 }, { "contrastive_loss": 4.1256103515625, "epoch": 0.2228808535862478, "mse_loss": 0.09957260638475418, "step": 1880 }, { "epoch": 0.22406639004149378, "grad_norm": 0.89453125, "learning_rate": 9.445e-05, "loss": 0.9374, "step": 1890 }, { "contrastive_loss": 4.0504150390625, "epoch": 0.22406639004149378, "mse_loss": 0.11110533773899078, "step": 1890 }, { "epoch": 0.22525192649673978, "grad_norm": 0.87109375, "learning_rate": 9.495e-05, "loss": 0.9518, "step": 1900 }, { "contrastive_loss": 4.250732421875, "epoch": 0.22525192649673978, "mse_loss": 0.13271529972553253, "step": 1900 }, { "epoch": 0.22643746295198577, "grad_norm": 0.86328125, "learning_rate": 9.545e-05, "loss": 0.9516, "step": 1910 }, { "contrastive_loss": 4.201171875, "epoch": 0.22643746295198577, "mse_loss": 0.09657766669988632, "step": 1910 }, { "epoch": 0.22762299940723177, "grad_norm": 0.828125, "learning_rate": 9.595e-05, "loss": 0.9513, "step": 1920 }, { "contrastive_loss": 4.120849609375, "epoch": 0.22762299940723177, "mse_loss": 0.12573781609535217, "step": 1920 }, { "epoch": 0.22880853586247776, "grad_norm": 0.7734375, "learning_rate": 9.645000000000001e-05, "loss": 0.9396, "step": 1930 }, { "contrastive_loss": 4.2469482421875, "epoch": 0.22880853586247776, "mse_loss": 0.11133687943220139, "step": 1930 }, { "epoch": 0.22999407231772376, "grad_norm": 1.359375, "learning_rate": 9.695000000000001e-05, "loss": 0.9497, "step": 1940 }, { "contrastive_loss": 4.157470703125, "epoch": 0.22999407231772376, "mse_loss": 0.103839211165905, "step": 1940 }, { "epoch": 0.23117960877296978, "grad_norm": 1.0078125, "learning_rate": 9.745000000000001e-05, "loss": 0.9478, "step": 1950 }, { "contrastive_loss": 4.186279296875, "epoch": 0.23117960877296978, "mse_loss": 0.10699611902236938, "step": 1950 }, { "epoch": 0.23236514522821577, "grad_norm": 0.9296875, "learning_rate": 9.795000000000001e-05, "loss": 0.9272, "step": 1960 }, { "contrastive_loss": 4.1700439453125, "epoch": 0.23236514522821577, "mse_loss": 0.1298399269580841, "step": 1960 }, { "epoch": 0.23355068168346177, "grad_norm": 1.140625, "learning_rate": 9.845000000000001e-05, "loss": 0.9611, "step": 1970 }, { "contrastive_loss": 4.2760009765625, "epoch": 0.23355068168346177, "mse_loss": 0.09741204231977463, "step": 1970 }, { "epoch": 0.23473621813870776, "grad_norm": 0.98828125, "learning_rate": 9.895e-05, "loss": 0.9579, "step": 1980 }, { "contrastive_loss": 4.3140869140625, "epoch": 0.23473621813870776, "mse_loss": 0.10733260214328766, "step": 1980 }, { "epoch": 0.23592175459395376, "grad_norm": 0.8515625, "learning_rate": 9.945e-05, "loss": 0.9497, "step": 1990 }, { "contrastive_loss": 4.20751953125, "epoch": 0.23592175459395376, "mse_loss": 0.08575756102800369, "step": 1990 }, { "epoch": 0.23710729104919975, "grad_norm": 1.0703125, "learning_rate": 9.995e-05, "loss": 0.9502, "step": 2000 }, { "contrastive_loss": 4.2021484375, "epoch": 0.23710729104919975, "mse_loss": 0.10003005713224411, "step": 2000 }, { "epoch": 0.23829282750444578, "grad_norm": 0.796875, "learning_rate": 0.00010045, "loss": 0.9372, "step": 2010 }, { "contrastive_loss": 4.0936279296875, "epoch": 0.23829282750444578, "mse_loss": 0.13799813389778137, "step": 2010 }, { "epoch": 0.23947836395969177, "grad_norm": 0.953125, "learning_rate": 0.00010095000000000001, "loss": 0.9495, "step": 2020 }, { "contrastive_loss": 4.16845703125, "epoch": 0.23947836395969177, "mse_loss": 0.11558067798614502, "step": 2020 }, { "epoch": 0.24066390041493776, "grad_norm": 0.8359375, "learning_rate": 0.00010145, "loss": 0.9474, "step": 2030 }, { "contrastive_loss": 4.12060546875, "epoch": 0.24066390041493776, "mse_loss": 0.09353803098201752, "step": 2030 }, { "epoch": 0.24184943687018376, "grad_norm": 0.7109375, "learning_rate": 0.00010195000000000001, "loss": 0.9382, "step": 2040 }, { "contrastive_loss": 4.2857666015625, "epoch": 0.24184943687018376, "mse_loss": 0.12248522788286209, "step": 2040 }, { "epoch": 0.24303497332542975, "grad_norm": 1.0234375, "learning_rate": 0.00010245, "loss": 0.9605, "step": 2050 }, { "contrastive_loss": 4.4405517578125, "epoch": 0.24303497332542975, "mse_loss": 0.08722901344299316, "step": 2050 }, { "epoch": 0.24422050978067575, "grad_norm": 0.8984375, "learning_rate": 0.00010295000000000001, "loss": 0.9541, "step": 2060 }, { "contrastive_loss": 4.280029296875, "epoch": 0.24422050978067575, "mse_loss": 0.12829391658306122, "step": 2060 }, { "epoch": 0.24540604623592174, "grad_norm": 0.7890625, "learning_rate": 0.00010345000000000001, "loss": 0.9401, "step": 2070 }, { "contrastive_loss": 4.157958984375, "epoch": 0.24540604623592174, "mse_loss": 0.09049161523580551, "step": 2070 }, { "epoch": 0.24659158269116777, "grad_norm": 0.7890625, "learning_rate": 0.00010395000000000002, "loss": 0.936, "step": 2080 }, { "contrastive_loss": 4.0238037109375, "epoch": 0.24659158269116777, "mse_loss": 0.11914390325546265, "step": 2080 }, { "epoch": 0.24777711914641376, "grad_norm": 1.1640625, "learning_rate": 0.00010445, "loss": 0.9356, "step": 2090 }, { "contrastive_loss": 4.1146240234375, "epoch": 0.24777711914641376, "mse_loss": 0.07598469406366348, "step": 2090 }, { "epoch": 0.24896265560165975, "grad_norm": 1.1953125, "learning_rate": 0.00010495000000000002, "loss": 0.9343, "step": 2100 }, { "contrastive_loss": 4.10498046875, "epoch": 0.24896265560165975, "mse_loss": 0.10189808905124664, "step": 2100 }, { "epoch": 0.25014819205690575, "grad_norm": 0.953125, "learning_rate": 0.00010545, "loss": 0.9408, "step": 2110 }, { "contrastive_loss": 4.226318359375, "epoch": 0.25014819205690575, "mse_loss": 0.10697383433580399, "step": 2110 }, { "epoch": 0.25133372851215174, "grad_norm": 0.9375, "learning_rate": 0.00010595000000000001, "loss": 0.9295, "step": 2120 }, { "contrastive_loss": 4.03564453125, "epoch": 0.25133372851215174, "mse_loss": 0.09470327198505402, "step": 2120 }, { "epoch": 0.25251926496739774, "grad_norm": 0.765625, "learning_rate": 0.00010645, "loss": 0.9364, "step": 2130 }, { "contrastive_loss": 4.19775390625, "epoch": 0.25251926496739774, "mse_loss": 0.08524157106876373, "step": 2130 }, { "epoch": 0.25370480142264373, "grad_norm": 0.98828125, "learning_rate": 0.00010695, "loss": 0.9422, "step": 2140 }, { "contrastive_loss": 4.109375, "epoch": 0.25370480142264373, "mse_loss": 0.1580784022808075, "step": 2140 }, { "epoch": 0.2548903378778897, "grad_norm": 0.9140625, "learning_rate": 0.00010745000000000001, "loss": 0.9432, "step": 2150 }, { "contrastive_loss": 4.0654296875, "epoch": 0.2548903378778897, "mse_loss": 0.1260327845811844, "step": 2150 }, { "epoch": 0.2560758743331357, "grad_norm": 0.97265625, "learning_rate": 0.00010795, "loss": 0.9435, "step": 2160 }, { "contrastive_loss": 4.2244873046875, "epoch": 0.2560758743331357, "mse_loss": 0.12566527724266052, "step": 2160 }, { "epoch": 0.2572614107883817, "grad_norm": 0.8046875, "learning_rate": 0.00010845000000000001, "loss": 0.9429, "step": 2170 }, { "contrastive_loss": 4.3414306640625, "epoch": 0.2572614107883817, "mse_loss": 0.08097697794437408, "step": 2170 }, { "epoch": 0.25844694724362777, "grad_norm": 1.25, "learning_rate": 0.00010894999999999999, "loss": 0.9363, "step": 2180 }, { "contrastive_loss": 4.2471923828125, "epoch": 0.25844694724362777, "mse_loss": 0.10569234192371368, "step": 2180 }, { "epoch": 0.25963248369887376, "grad_norm": 0.796875, "learning_rate": 0.00010945, "loss": 0.9382, "step": 2190 }, { "contrastive_loss": 4.2686767578125, "epoch": 0.25963248369887376, "mse_loss": 0.12862789630889893, "step": 2190 }, { "epoch": 0.26081802015411976, "grad_norm": 0.9765625, "learning_rate": 0.00010995, "loss": 0.9658, "step": 2200 }, { "contrastive_loss": 4.041259765625, "epoch": 0.26081802015411976, "mse_loss": 0.10367345809936523, "step": 2200 }, { "epoch": 0.26200355660936575, "grad_norm": 0.73828125, "learning_rate": 0.00011045000000000001, "loss": 0.9338, "step": 2210 }, { "contrastive_loss": 4.115478515625, "epoch": 0.26200355660936575, "mse_loss": 0.10416799038648605, "step": 2210 }, { "epoch": 0.26318909306461175, "grad_norm": 0.8828125, "learning_rate": 0.00011095, "loss": 0.9331, "step": 2220 }, { "contrastive_loss": 4.079833984375, "epoch": 0.26318909306461175, "mse_loss": 0.12544551491737366, "step": 2220 }, { "epoch": 0.26437462951985774, "grad_norm": 0.94921875, "learning_rate": 0.00011145000000000001, "loss": 0.9318, "step": 2230 }, { "contrastive_loss": 4.2010498046875, "epoch": 0.26437462951985774, "mse_loss": 0.11763028055429459, "step": 2230 }, { "epoch": 0.26556016597510373, "grad_norm": 0.7578125, "learning_rate": 0.00011195, "loss": 0.9394, "step": 2240 }, { "contrastive_loss": 3.99560546875, "epoch": 0.26556016597510373, "mse_loss": 0.10625506192445755, "step": 2240 }, { "epoch": 0.26674570243034973, "grad_norm": 0.72265625, "learning_rate": 0.00011245000000000001, "loss": 0.9429, "step": 2250 }, { "contrastive_loss": 4.2054443359375, "epoch": 0.26674570243034973, "mse_loss": 0.07600294053554535, "step": 2250 }, { "epoch": 0.2679312388855957, "grad_norm": 0.66015625, "learning_rate": 0.00011295, "loss": 0.9435, "step": 2260 }, { "contrastive_loss": 4.1497802734375, "epoch": 0.2679312388855957, "mse_loss": 0.1267300397157669, "step": 2260 }, { "epoch": 0.2691167753408417, "grad_norm": 0.828125, "learning_rate": 0.00011345, "loss": 0.9447, "step": 2270 }, { "contrastive_loss": 4.067626953125, "epoch": 0.2691167753408417, "mse_loss": 0.11929547041654587, "step": 2270 }, { "epoch": 0.2703023117960877, "grad_norm": 0.890625, "learning_rate": 0.00011395, "loss": 0.9437, "step": 2280 }, { "contrastive_loss": 4.1259765625, "epoch": 0.2703023117960877, "mse_loss": 0.1080135926604271, "step": 2280 }, { "epoch": 0.2714878482513337, "grad_norm": 0.84765625, "learning_rate": 0.00011445000000000002, "loss": 0.9379, "step": 2290 }, { "contrastive_loss": 4.1778564453125, "epoch": 0.2714878482513337, "mse_loss": 0.11474042385816574, "step": 2290 }, { "epoch": 0.2726733847065797, "grad_norm": 0.73046875, "learning_rate": 0.00011495, "loss": 0.9251, "step": 2300 }, { "contrastive_loss": 4.0677490234375, "epoch": 0.2726733847065797, "mse_loss": 0.11694078892469406, "step": 2300 }, { "epoch": 0.27385892116182575, "grad_norm": 0.83203125, "learning_rate": 0.00011545000000000001, "loss": 0.9315, "step": 2310 }, { "contrastive_loss": 4.1455078125, "epoch": 0.27385892116182575, "mse_loss": 0.1054471954703331, "step": 2310 }, { "epoch": 0.27504445761707175, "grad_norm": 0.73046875, "learning_rate": 0.00011595, "loss": 0.9205, "step": 2320 }, { "contrastive_loss": 4.2100830078125, "epoch": 0.27504445761707175, "mse_loss": 0.14549806714057922, "step": 2320 }, { "epoch": 0.27622999407231774, "grad_norm": 0.7578125, "learning_rate": 0.00011645000000000001, "loss": 0.943, "step": 2330 }, { "contrastive_loss": 4.1688232421875, "epoch": 0.27622999407231774, "mse_loss": 0.13455815613269806, "step": 2330 }, { "epoch": 0.27741553052756374, "grad_norm": 1.078125, "learning_rate": 0.00011695000000000001, "loss": 0.9526, "step": 2340 }, { "contrastive_loss": 4.112060546875, "epoch": 0.27741553052756374, "mse_loss": 0.072291798889637, "step": 2340 }, { "epoch": 0.27860106698280973, "grad_norm": 0.72265625, "learning_rate": 0.00011745000000000001, "loss": 0.9529, "step": 2350 }, { "contrastive_loss": 4.1024169921875, "epoch": 0.27860106698280973, "mse_loss": 0.13696914911270142, "step": 2350 }, { "epoch": 0.2797866034380557, "grad_norm": 0.78515625, "learning_rate": 0.00011795000000000001, "loss": 0.9299, "step": 2360 }, { "contrastive_loss": 4.3265380859375, "epoch": 0.2797866034380557, "mse_loss": 0.09104227274656296, "step": 2360 }, { "epoch": 0.2809721398933017, "grad_norm": 0.60546875, "learning_rate": 0.00011845000000000002, "loss": 0.9301, "step": 2370 }, { "contrastive_loss": 4.1385498046875, "epoch": 0.2809721398933017, "mse_loss": 0.09500539302825928, "step": 2370 }, { "epoch": 0.2821576763485477, "grad_norm": 0.6328125, "learning_rate": 0.00011895, "loss": 0.9279, "step": 2380 }, { "contrastive_loss": 4.1937255859375, "epoch": 0.2821576763485477, "mse_loss": 0.08759429305791855, "step": 2380 }, { "epoch": 0.2833432128037937, "grad_norm": 0.86328125, "learning_rate": 0.00011944999999999999, "loss": 0.9305, "step": 2390 }, { "contrastive_loss": 4.1182861328125, "epoch": 0.2833432128037937, "mse_loss": 0.1020248606801033, "step": 2390 }, { "epoch": 0.2845287492590397, "grad_norm": 0.71484375, "learning_rate": 0.00011995, "loss": 0.9403, "step": 2400 }, { "contrastive_loss": 4.1707763671875, "epoch": 0.2845287492590397, "mse_loss": 0.09623008966445923, "step": 2400 }, { "epoch": 0.2857142857142857, "grad_norm": 0.7578125, "learning_rate": 0.00012045, "loss": 0.9243, "step": 2410 }, { "contrastive_loss": 4.1795654296875, "epoch": 0.2857142857142857, "mse_loss": 0.07955305278301239, "step": 2410 }, { "epoch": 0.2868998221695317, "grad_norm": 1.1796875, "learning_rate": 0.00012095000000000001, "loss": 0.9409, "step": 2420 }, { "contrastive_loss": 4.1649169921875, "epoch": 0.2868998221695317, "mse_loss": 0.12195749580860138, "step": 2420 }, { "epoch": 0.2880853586247777, "grad_norm": 0.8515625, "learning_rate": 0.00012145, "loss": 0.9345, "step": 2430 }, { "contrastive_loss": 4.0960693359375, "epoch": 0.2880853586247777, "mse_loss": 0.10818871110677719, "step": 2430 }, { "epoch": 0.28927089508002374, "grad_norm": 0.86328125, "learning_rate": 0.00012195000000000001, "loss": 0.9369, "step": 2440 }, { "contrastive_loss": 4.25390625, "epoch": 0.28927089508002374, "mse_loss": 0.11904717981815338, "step": 2440 }, { "epoch": 0.29045643153526973, "grad_norm": 0.71484375, "learning_rate": 0.00012245, "loss": 0.9312, "step": 2450 }, { "contrastive_loss": 4.3038330078125, "epoch": 0.29045643153526973, "mse_loss": 0.11727198213338852, "step": 2450 }, { "epoch": 0.2916419679905157, "grad_norm": 0.87109375, "learning_rate": 0.00012295, "loss": 0.9307, "step": 2460 }, { "contrastive_loss": 4.1104736328125, "epoch": 0.2916419679905157, "mse_loss": 0.09358099848031998, "step": 2460 }, { "epoch": 0.2928275044457617, "grad_norm": 0.7578125, "learning_rate": 0.00012345, "loss": 0.9259, "step": 2470 }, { "contrastive_loss": 4.0499267578125, "epoch": 0.2928275044457617, "mse_loss": 0.07992824167013168, "step": 2470 }, { "epoch": 0.2940130409010077, "grad_norm": 0.8125, "learning_rate": 0.00012395, "loss": 0.915, "step": 2480 }, { "contrastive_loss": 4.173095703125, "epoch": 0.2940130409010077, "mse_loss": 0.09342525899410248, "step": 2480 }, { "epoch": 0.2951985773562537, "grad_norm": 0.7890625, "learning_rate": 0.00012445, "loss": 0.9147, "step": 2490 }, { "contrastive_loss": 4.2012939453125, "epoch": 0.2951985773562537, "mse_loss": 0.10439717769622803, "step": 2490 }, { "epoch": 0.2963841138114997, "grad_norm": 1.3046875, "learning_rate": 0.00012495, "loss": 0.934, "step": 2500 }, { "contrastive_loss": 4.04638671875, "epoch": 0.2963841138114997, "mse_loss": 0.10154183954000473, "step": 2500 }, { "epoch": 0.2975696502667457, "grad_norm": 0.8203125, "learning_rate": 0.00012545, "loss": 0.9221, "step": 2510 }, { "contrastive_loss": 4.1107177734375, "epoch": 0.2975696502667457, "mse_loss": 0.09549711644649506, "step": 2510 }, { "epoch": 0.2987551867219917, "grad_norm": 0.7734375, "learning_rate": 0.00012595000000000003, "loss": 0.9236, "step": 2520 }, { "contrastive_loss": 4.24267578125, "epoch": 0.2987551867219917, "mse_loss": 0.09776052087545395, "step": 2520 }, { "epoch": 0.2999407231772377, "grad_norm": 0.7421875, "learning_rate": 0.00012645, "loss": 0.9283, "step": 2530 }, { "contrastive_loss": 4.16259765625, "epoch": 0.2999407231772377, "mse_loss": 0.06647392362356186, "step": 2530 }, { "epoch": 0.3011262596324837, "grad_norm": 0.82421875, "learning_rate": 0.00012695000000000002, "loss": 0.9258, "step": 2540 }, { "contrastive_loss": 4.116455078125, "epoch": 0.3011262596324837, "mse_loss": 0.08860443532466888, "step": 2540 }, { "epoch": 0.3023117960877297, "grad_norm": 0.72265625, "learning_rate": 0.00012745, "loss": 0.9308, "step": 2550 }, { "contrastive_loss": 4.2393798828125, "epoch": 0.3023117960877297, "mse_loss": 0.09423919767141342, "step": 2550 }, { "epoch": 0.3034973325429757, "grad_norm": 0.80859375, "learning_rate": 0.00012795000000000002, "loss": 0.9369, "step": 2560 }, { "contrastive_loss": 4.0579833984375, "epoch": 0.3034973325429757, "mse_loss": 0.11453592777252197, "step": 2560 }, { "epoch": 0.30468286899822167, "grad_norm": 0.92578125, "learning_rate": 0.00012845, "loss": 0.9433, "step": 2570 }, { "contrastive_loss": 4.1441650390625, "epoch": 0.30468286899822167, "mse_loss": 0.12784495949745178, "step": 2570 }, { "epoch": 0.3058684054534677, "grad_norm": 0.65234375, "learning_rate": 0.00012895000000000002, "loss": 0.9436, "step": 2580 }, { "contrastive_loss": 4.2041015625, "epoch": 0.3058684054534677, "mse_loss": 0.09077877551317215, "step": 2580 }, { "epoch": 0.3070539419087137, "grad_norm": 0.85546875, "learning_rate": 0.00012945, "loss": 0.926, "step": 2590 }, { "contrastive_loss": 4.190673828125, "epoch": 0.3070539419087137, "mse_loss": 0.08934297412633896, "step": 2590 }, { "epoch": 0.3082394783639597, "grad_norm": 1.15625, "learning_rate": 0.00012995000000000001, "loss": 0.9239, "step": 2600 }, { "contrastive_loss": 4.1075439453125, "epoch": 0.3082394783639597, "mse_loss": 0.07681616395711899, "step": 2600 }, { "epoch": 0.3094250148192057, "grad_norm": 0.84765625, "learning_rate": 0.00013045, "loss": 0.918, "step": 2610 }, { "contrastive_loss": 4.041015625, "epoch": 0.3094250148192057, "mse_loss": 0.07501175254583359, "step": 2610 }, { "epoch": 0.3106105512744517, "grad_norm": 0.921875, "learning_rate": 0.00013095, "loss": 0.9073, "step": 2620 }, { "contrastive_loss": 4.141845703125, "epoch": 0.3106105512744517, "mse_loss": 0.07861142605543137, "step": 2620 }, { "epoch": 0.3117960877296977, "grad_norm": 0.6484375, "learning_rate": 0.00013145, "loss": 0.9226, "step": 2630 }, { "contrastive_loss": 3.96435546875, "epoch": 0.3117960877296977, "mse_loss": 0.09910057485103607, "step": 2630 }, { "epoch": 0.3129816241849437, "grad_norm": 0.74609375, "learning_rate": 0.00013195, "loss": 0.9138, "step": 2640 }, { "contrastive_loss": 4.1943359375, "epoch": 0.3129816241849437, "mse_loss": 0.07982921600341797, "step": 2640 }, { "epoch": 0.3141671606401897, "grad_norm": 0.82421875, "learning_rate": 0.00013245, "loss": 0.9264, "step": 2650 }, { "contrastive_loss": 4.080810546875, "epoch": 0.3141671606401897, "mse_loss": 0.16498132050037384, "step": 2650 }, { "epoch": 0.3153526970954357, "grad_norm": 0.66015625, "learning_rate": 0.00013295, "loss": 0.9301, "step": 2660 }, { "contrastive_loss": 4.0474853515625, "epoch": 0.3153526970954357, "mse_loss": 0.1296045184135437, "step": 2660 }, { "epoch": 0.31653823355068167, "grad_norm": 0.66796875, "learning_rate": 0.00013345000000000002, "loss": 0.9159, "step": 2670 }, { "contrastive_loss": 3.9180908203125, "epoch": 0.31653823355068167, "mse_loss": 0.1191863939166069, "step": 2670 }, { "epoch": 0.31772377000592766, "grad_norm": 0.58203125, "learning_rate": 0.00013395, "loss": 0.9219, "step": 2680 }, { "contrastive_loss": 4.1751708984375, "epoch": 0.31772377000592766, "mse_loss": 0.12837398052215576, "step": 2680 }, { "epoch": 0.31890930646117366, "grad_norm": 0.9765625, "learning_rate": 0.00013445000000000002, "loss": 0.9212, "step": 2690 }, { "contrastive_loss": 4.051025390625, "epoch": 0.31890930646117366, "mse_loss": 0.11364573985338211, "step": 2690 }, { "epoch": 0.32009484291641965, "grad_norm": 1.078125, "learning_rate": 0.00013495, "loss": 0.9367, "step": 2700 }, { "contrastive_loss": 3.9892578125, "epoch": 0.32009484291641965, "mse_loss": 0.11066421121358871, "step": 2700 }, { "epoch": 0.3212803793716657, "grad_norm": 0.85546875, "learning_rate": 0.00013545, "loss": 0.9249, "step": 2710 }, { "contrastive_loss": 4.049560546875, "epoch": 0.3212803793716657, "mse_loss": 0.1116080954670906, "step": 2710 }, { "epoch": 0.3224659158269117, "grad_norm": 0.97265625, "learning_rate": 0.00013595, "loss": 0.9226, "step": 2720 }, { "contrastive_loss": 4.085693359375, "epoch": 0.3224659158269117, "mse_loss": 0.11677588522434235, "step": 2720 }, { "epoch": 0.3236514522821577, "grad_norm": 0.8125, "learning_rate": 0.00013645, "loss": 0.9258, "step": 2730 }, { "contrastive_loss": 4.1217041015625, "epoch": 0.3236514522821577, "mse_loss": 0.12062796205282211, "step": 2730 }, { "epoch": 0.3248369887374037, "grad_norm": 0.98046875, "learning_rate": 0.00013695, "loss": 0.9253, "step": 2740 }, { "contrastive_loss": 4.1990966796875, "epoch": 0.3248369887374037, "mse_loss": 0.10972123593091965, "step": 2740 }, { "epoch": 0.3260225251926497, "grad_norm": 0.7421875, "learning_rate": 0.00013745, "loss": 0.905, "step": 2750 }, { "contrastive_loss": 4.201171875, "epoch": 0.3260225251926497, "mse_loss": 0.14234612882137299, "step": 2750 }, { "epoch": 0.3272080616478957, "grad_norm": 0.5859375, "learning_rate": 0.00013795, "loss": 0.9156, "step": 2760 }, { "contrastive_loss": 4.0716552734375, "epoch": 0.3272080616478957, "mse_loss": 0.11335514485836029, "step": 2760 }, { "epoch": 0.32839359810314167, "grad_norm": 1.046875, "learning_rate": 0.00013845, "loss": 0.9193, "step": 2770 }, { "contrastive_loss": 4.194580078125, "epoch": 0.32839359810314167, "mse_loss": 0.09445101767778397, "step": 2770 }, { "epoch": 0.32957913455838767, "grad_norm": 0.76171875, "learning_rate": 0.00013895, "loss": 0.9292, "step": 2780 }, { "contrastive_loss": 4.2110595703125, "epoch": 0.32957913455838767, "mse_loss": 0.134410098195076, "step": 2780 }, { "epoch": 0.33076467101363366, "grad_norm": 0.58203125, "learning_rate": 0.00013945, "loss": 0.9306, "step": 2790 }, { "contrastive_loss": 4.1082763671875, "epoch": 0.33076467101363366, "mse_loss": 0.12694312632083893, "step": 2790 }, { "epoch": 0.33195020746887965, "grad_norm": 0.73828125, "learning_rate": 0.00013995000000000001, "loss": 0.918, "step": 2800 }, { "contrastive_loss": 4.057373046875, "epoch": 0.33195020746887965, "mse_loss": 0.09668927639722824, "step": 2800 }, { "epoch": 0.33313574392412565, "grad_norm": 1.046875, "learning_rate": 0.00014045000000000003, "loss": 0.9289, "step": 2810 }, { "contrastive_loss": 4.0596923828125, "epoch": 0.33313574392412565, "mse_loss": 0.0879218801856041, "step": 2810 }, { "epoch": 0.33432128037937164, "grad_norm": 0.8671875, "learning_rate": 0.00014095, "loss": 0.9214, "step": 2820 }, { "contrastive_loss": 4.106689453125, "epoch": 0.33432128037937164, "mse_loss": 0.08467002958059311, "step": 2820 }, { "epoch": 0.33550681683461764, "grad_norm": 0.91796875, "learning_rate": 0.00014145000000000002, "loss": 0.9078, "step": 2830 }, { "contrastive_loss": 4.06396484375, "epoch": 0.33550681683461764, "mse_loss": 0.09941147267818451, "step": 2830 }, { "epoch": 0.3366923532898637, "grad_norm": 0.9765625, "learning_rate": 0.00014195, "loss": 0.9125, "step": 2840 }, { "contrastive_loss": 4.11669921875, "epoch": 0.3366923532898637, "mse_loss": 0.0979636088013649, "step": 2840 }, { "epoch": 0.3378778897451097, "grad_norm": 0.7890625, "learning_rate": 0.00014245000000000002, "loss": 0.9196, "step": 2850 }, { "contrastive_loss": 4.1146240234375, "epoch": 0.3378778897451097, "mse_loss": 0.10780799388885498, "step": 2850 }, { "epoch": 0.3390634262003557, "grad_norm": 0.6640625, "learning_rate": 0.00014295, "loss": 0.9142, "step": 2860 }, { "contrastive_loss": 4.1497802734375, "epoch": 0.3390634262003557, "mse_loss": 0.07327040284872055, "step": 2860 }, { "epoch": 0.34024896265560167, "grad_norm": 0.59375, "learning_rate": 0.00014345000000000002, "loss": 0.9253, "step": 2870 }, { "contrastive_loss": 4.1048583984375, "epoch": 0.34024896265560167, "mse_loss": 0.1151822954416275, "step": 2870 }, { "epoch": 0.34143449911084767, "grad_norm": 0.82421875, "learning_rate": 0.00014395, "loss": 0.9243, "step": 2880 }, { "contrastive_loss": 4.0675048828125, "epoch": 0.34143449911084767, "mse_loss": 0.0838247537612915, "step": 2880 }, { "epoch": 0.34262003556609366, "grad_norm": 0.80078125, "learning_rate": 0.00014445, "loss": 0.9155, "step": 2890 }, { "contrastive_loss": 4.20068359375, "epoch": 0.34262003556609366, "mse_loss": 0.07073401659727097, "step": 2890 }, { "epoch": 0.34380557202133966, "grad_norm": 1.0234375, "learning_rate": 0.00014495, "loss": 0.9168, "step": 2900 }, { "contrastive_loss": 4.0311279296875, "epoch": 0.34380557202133966, "mse_loss": 0.14056892693042755, "step": 2900 }, { "epoch": 0.34499110847658565, "grad_norm": 0.8203125, "learning_rate": 0.00014544999999999998, "loss": 0.937, "step": 2910 }, { "contrastive_loss": 4.1070556640625, "epoch": 0.34499110847658565, "mse_loss": 0.09510018676519394, "step": 2910 }, { "epoch": 0.34617664493183165, "grad_norm": 1.203125, "learning_rate": 0.00014595, "loss": 0.9155, "step": 2920 }, { "contrastive_loss": 4.0753173828125, "epoch": 0.34617664493183165, "mse_loss": 0.10056906193494797, "step": 2920 }, { "epoch": 0.34736218138707764, "grad_norm": 0.796875, "learning_rate": 0.00014645, "loss": 0.9214, "step": 2930 }, { "contrastive_loss": 4.28662109375, "epoch": 0.34736218138707764, "mse_loss": 0.10941477119922638, "step": 2930 }, { "epoch": 0.34854771784232363, "grad_norm": 0.8046875, "learning_rate": 0.00014695000000000002, "loss": 0.908, "step": 2940 }, { "contrastive_loss": 4.1661376953125, "epoch": 0.34854771784232363, "mse_loss": 0.08876342326402664, "step": 2940 }, { "epoch": 0.34973325429756963, "grad_norm": 0.6640625, "learning_rate": 0.00014745, "loss": 0.9181, "step": 2950 }, { "contrastive_loss": 4.168212890625, "epoch": 0.34973325429756963, "mse_loss": 0.09709695726633072, "step": 2950 }, { "epoch": 0.3509187907528156, "grad_norm": 1.125, "learning_rate": 0.00014795000000000002, "loss": 0.9221, "step": 2960 }, { "contrastive_loss": 4.1435546875, "epoch": 0.3509187907528156, "mse_loss": 0.08089554309844971, "step": 2960 }, { "epoch": 0.3521043272080617, "grad_norm": 0.8125, "learning_rate": 0.00014845, "loss": 0.921, "step": 2970 }, { "contrastive_loss": 4.033447265625, "epoch": 0.3521043272080617, "mse_loss": 0.10814835131168365, "step": 2970 }, { "epoch": 0.35328986366330767, "grad_norm": 0.90234375, "learning_rate": 0.00014895000000000002, "loss": 0.914, "step": 2980 }, { "contrastive_loss": 4.0733642578125, "epoch": 0.35328986366330767, "mse_loss": 0.08581329137086868, "step": 2980 }, { "epoch": 0.35447540011855366, "grad_norm": 0.53515625, "learning_rate": 0.00014945, "loss": 0.9229, "step": 2990 }, { "contrastive_loss": 4.0294189453125, "epoch": 0.35447540011855366, "mse_loss": 0.08236070722341537, "step": 2990 }, { "epoch": 0.35566093657379966, "grad_norm": 0.74609375, "learning_rate": 0.00014995, "loss": 0.9201, "step": 3000 }, { "contrastive_loss": 4.080078125, "epoch": 0.35566093657379966, "mse_loss": 0.08455308526754379, "step": 3000 }, { "epoch": 0.35684647302904565, "grad_norm": 0.515625, "learning_rate": 0.00015045, "loss": 0.9076, "step": 3010 }, { "contrastive_loss": 4.1895751953125, "epoch": 0.35684647302904565, "mse_loss": 0.06355051696300507, "step": 3010 }, { "epoch": 0.35803200948429165, "grad_norm": 0.91015625, "learning_rate": 0.00015095, "loss": 0.9155, "step": 3020 }, { "contrastive_loss": 4.114501953125, "epoch": 0.35803200948429165, "mse_loss": 0.07370946556329727, "step": 3020 }, { "epoch": 0.35921754593953764, "grad_norm": 0.70703125, "learning_rate": 0.00015145, "loss": 0.915, "step": 3030 }, { "contrastive_loss": 4.06689453125, "epoch": 0.35921754593953764, "mse_loss": 0.08008497208356857, "step": 3030 }, { "epoch": 0.36040308239478364, "grad_norm": 0.55859375, "learning_rate": 0.00015195, "loss": 0.8968, "step": 3040 }, { "contrastive_loss": 4.03515625, "epoch": 0.36040308239478364, "mse_loss": 0.06228696554899216, "step": 3040 }, { "epoch": 0.36158861885002963, "grad_norm": 1.3671875, "learning_rate": 0.00015245, "loss": 0.9066, "step": 3050 }, { "contrastive_loss": 4.208740234375, "epoch": 0.36158861885002963, "mse_loss": 0.12831713259220123, "step": 3050 }, { "epoch": 0.3627741553052756, "grad_norm": 0.60546875, "learning_rate": 0.00015295, "loss": 0.9176, "step": 3060 }, { "contrastive_loss": 3.9603271484375, "epoch": 0.3627741553052756, "mse_loss": 0.14974510669708252, "step": 3060 }, { "epoch": 0.3639596917605216, "grad_norm": 0.734375, "learning_rate": 0.00015345000000000002, "loss": 0.9135, "step": 3070 }, { "contrastive_loss": 4.0780029296875, "epoch": 0.3639596917605216, "mse_loss": 0.1219206303358078, "step": 3070 }, { "epoch": 0.3651452282157676, "grad_norm": 0.87109375, "learning_rate": 0.00015395000000000003, "loss": 0.9202, "step": 3080 }, { "contrastive_loss": 3.947021484375, "epoch": 0.3651452282157676, "mse_loss": 0.09065096080303192, "step": 3080 }, { "epoch": 0.3663307646710136, "grad_norm": 0.69140625, "learning_rate": 0.00015445000000000001, "loss": 0.9113, "step": 3090 }, { "contrastive_loss": 3.9986572265625, "epoch": 0.3663307646710136, "mse_loss": 0.09589196741580963, "step": 3090 }, { "epoch": 0.36751630112625966, "grad_norm": 0.7578125, "learning_rate": 0.00015495000000000003, "loss": 0.9208, "step": 3100 }, { "contrastive_loss": 4.0753173828125, "epoch": 0.36751630112625966, "mse_loss": 0.13686999678611755, "step": 3100 }, { "epoch": 0.36870183758150565, "grad_norm": 0.78125, "learning_rate": 0.00015545, "loss": 0.9285, "step": 3110 }, { "contrastive_loss": 3.983642578125, "epoch": 0.36870183758150565, "mse_loss": 0.12604930996894836, "step": 3110 }, { "epoch": 0.36988737403675165, "grad_norm": 0.6953125, "learning_rate": 0.00015595000000000002, "loss": 0.922, "step": 3120 }, { "contrastive_loss": 3.973388671875, "epoch": 0.36988737403675165, "mse_loss": 0.13886938989162445, "step": 3120 }, { "epoch": 0.37107291049199764, "grad_norm": 0.57421875, "learning_rate": 0.00015645, "loss": 0.928, "step": 3130 }, { "contrastive_loss": 4.0697021484375, "epoch": 0.37107291049199764, "mse_loss": 0.09008538722991943, "step": 3130 }, { "epoch": 0.37225844694724364, "grad_norm": 0.76953125, "learning_rate": 0.00015695, "loss": 0.9136, "step": 3140 }, { "contrastive_loss": 4.160888671875, "epoch": 0.37225844694724364, "mse_loss": 0.10017406940460205, "step": 3140 }, { "epoch": 0.37344398340248963, "grad_norm": 0.58984375, "learning_rate": 0.00015745, "loss": 0.9217, "step": 3150 }, { "contrastive_loss": 4.17041015625, "epoch": 0.37344398340248963, "mse_loss": 0.09836184978485107, "step": 3150 }, { "epoch": 0.3746295198577356, "grad_norm": 0.71484375, "learning_rate": 0.00015795, "loss": 0.9288, "step": 3160 }, { "contrastive_loss": 4.041259765625, "epoch": 0.3746295198577356, "mse_loss": 0.09394023567438126, "step": 3160 }, { "epoch": 0.3758150563129816, "grad_norm": 0.62109375, "learning_rate": 0.00015845, "loss": 0.901, "step": 3170 }, { "contrastive_loss": 4.046142578125, "epoch": 0.3758150563129816, "mse_loss": 0.10193105041980743, "step": 3170 }, { "epoch": 0.3770005927682276, "grad_norm": 0.58984375, "learning_rate": 0.00015895, "loss": 0.9094, "step": 3180 }, { "contrastive_loss": 4.1051025390625, "epoch": 0.3770005927682276, "mse_loss": 0.12234655767679214, "step": 3180 }, { "epoch": 0.3781861292234736, "grad_norm": 0.80859375, "learning_rate": 0.00015945, "loss": 0.9186, "step": 3190 }, { "contrastive_loss": 4.0322265625, "epoch": 0.3781861292234736, "mse_loss": 0.12175304442644119, "step": 3190 }, { "epoch": 0.3793716656787196, "grad_norm": 0.74609375, "learning_rate": 0.00015995, "loss": 0.9225, "step": 3200 }, { "contrastive_loss": 4.08837890625, "epoch": 0.3793716656787196, "mse_loss": 0.11290944367647171, "step": 3200 }, { "epoch": 0.3805572021339656, "grad_norm": 0.62890625, "learning_rate": 0.00016045000000000002, "loss": 0.9015, "step": 3210 }, { "contrastive_loss": 4.1136474609375, "epoch": 0.3805572021339656, "mse_loss": 0.07840144634246826, "step": 3210 }, { "epoch": 0.3817427385892116, "grad_norm": 0.6953125, "learning_rate": 0.00016095, "loss": 0.9103, "step": 3220 }, { "contrastive_loss": 4.189208984375, "epoch": 0.3817427385892116, "mse_loss": 0.11225994676351547, "step": 3220 }, { "epoch": 0.38292827504445764, "grad_norm": 0.640625, "learning_rate": 0.00016145000000000002, "loss": 0.9135, "step": 3230 }, { "contrastive_loss": 4.1279296875, "epoch": 0.38292827504445764, "mse_loss": 0.06411908566951752, "step": 3230 }, { "epoch": 0.38411381149970364, "grad_norm": 0.65625, "learning_rate": 0.00016195, "loss": 0.8995, "step": 3240 }, { "contrastive_loss": 4.1324462890625, "epoch": 0.38411381149970364, "mse_loss": 0.08717727661132812, "step": 3240 }, { "epoch": 0.38529934795494963, "grad_norm": 0.69140625, "learning_rate": 0.00016245000000000002, "loss": 0.9163, "step": 3250 }, { "contrastive_loss": 4.201904296875, "epoch": 0.38529934795494963, "mse_loss": 0.07212595641613007, "step": 3250 }, { "epoch": 0.38648488441019563, "grad_norm": 0.76171875, "learning_rate": 0.00016295, "loss": 0.9224, "step": 3260 }, { "contrastive_loss": 4.133056640625, "epoch": 0.38648488441019563, "mse_loss": 0.08621302992105484, "step": 3260 }, { "epoch": 0.3876704208654416, "grad_norm": 0.859375, "learning_rate": 0.00016345000000000002, "loss": 0.9123, "step": 3270 }, { "contrastive_loss": 3.95263671875, "epoch": 0.3876704208654416, "mse_loss": 0.09338728338479996, "step": 3270 }, { "epoch": 0.3888559573206876, "grad_norm": 0.6796875, "learning_rate": 0.00016395, "loss": 0.9092, "step": 3280 }, { "contrastive_loss": 4.201904296875, "epoch": 0.3888559573206876, "mse_loss": 0.1006946936249733, "step": 3280 }, { "epoch": 0.3900414937759336, "grad_norm": 0.8046875, "learning_rate": 0.00016445, "loss": 0.9195, "step": 3290 }, { "contrastive_loss": 3.9390869140625, "epoch": 0.3900414937759336, "mse_loss": 0.1150117963552475, "step": 3290 }, { "epoch": 0.3912270302311796, "grad_norm": 0.671875, "learning_rate": 0.00016495, "loss": 0.9086, "step": 3300 }, { "contrastive_loss": 4.100341796875, "epoch": 0.3912270302311796, "mse_loss": 0.09393102675676346, "step": 3300 }, { "epoch": 0.3924125666864256, "grad_norm": 0.91015625, "learning_rate": 0.00016545, "loss": 0.9139, "step": 3310 }, { "contrastive_loss": 4.1309814453125, "epoch": 0.3924125666864256, "mse_loss": 0.08961351960897446, "step": 3310 }, { "epoch": 0.3935981031416716, "grad_norm": 0.7421875, "learning_rate": 0.00016595, "loss": 0.9199, "step": 3320 }, { "contrastive_loss": 4.126953125, "epoch": 0.3935981031416716, "mse_loss": 0.0747634768486023, "step": 3320 }, { "epoch": 0.3947836395969176, "grad_norm": 0.70703125, "learning_rate": 0.00016645, "loss": 0.9173, "step": 3330 }, { "contrastive_loss": 4.127685546875, "epoch": 0.3947836395969176, "mse_loss": 0.09172222763299942, "step": 3330 }, { "epoch": 0.3959691760521636, "grad_norm": 0.6796875, "learning_rate": 0.00016695000000000002, "loss": 0.9085, "step": 3340 }, { "contrastive_loss": 4.0966796875, "epoch": 0.3959691760521636, "mse_loss": 0.16327519714832306, "step": 3340 }, { "epoch": 0.3971547125074096, "grad_norm": 0.74609375, "learning_rate": 0.00016745, "loss": 0.9243, "step": 3350 }, { "contrastive_loss": 4.225830078125, "epoch": 0.3971547125074096, "mse_loss": 0.09614782780408859, "step": 3350 }, { "epoch": 0.3983402489626556, "grad_norm": 0.80078125, "learning_rate": 0.00016795000000000002, "loss": 0.9343, "step": 3360 }, { "contrastive_loss": 4.118408203125, "epoch": 0.3983402489626556, "mse_loss": 0.11181510984897614, "step": 3360 }, { "epoch": 0.3995257854179016, "grad_norm": 0.8125, "learning_rate": 0.00016845000000000003, "loss": 0.929, "step": 3370 }, { "contrastive_loss": 4.1014404296875, "epoch": 0.3995257854179016, "mse_loss": 0.11331654340028763, "step": 3370 }, { "epoch": 0.4007113218731476, "grad_norm": 0.6875, "learning_rate": 0.00016895000000000001, "loss": 0.92, "step": 3380 }, { "contrastive_loss": 4.24755859375, "epoch": 0.4007113218731476, "mse_loss": 0.10119782388210297, "step": 3380 }, { "epoch": 0.4018968583283936, "grad_norm": 1.796875, "learning_rate": 0.00016945, "loss": 0.9342, "step": 3390 }, { "contrastive_loss": 4.126220703125, "epoch": 0.4018968583283936, "mse_loss": 0.11726045608520508, "step": 3390 }, { "epoch": 0.4030823947836396, "grad_norm": 0.875, "learning_rate": 0.00016995, "loss": 0.9399, "step": 3400 }, { "contrastive_loss": 4.0177001953125, "epoch": 0.4030823947836396, "mse_loss": 0.1355299949645996, "step": 3400 }, { "epoch": 0.4042679312388856, "grad_norm": 0.80078125, "learning_rate": 0.00017045, "loss": 0.9478, "step": 3410 }, { "contrastive_loss": 4.3665771484375, "epoch": 0.4042679312388856, "mse_loss": 0.13617165386676788, "step": 3410 }, { "epoch": 0.4054534676941316, "grad_norm": 0.7265625, "learning_rate": 0.00017095, "loss": 0.9316, "step": 3420 }, { "contrastive_loss": 3.9686279296875, "epoch": 0.4054534676941316, "mse_loss": 0.11073071509599686, "step": 3420 }, { "epoch": 0.4066390041493776, "grad_norm": 0.7421875, "learning_rate": 0.00017145, "loss": 0.9245, "step": 3430 }, { "contrastive_loss": 3.9547119140625, "epoch": 0.4066390041493776, "mse_loss": 0.10522333532571793, "step": 3430 }, { "epoch": 0.4078245406046236, "grad_norm": 0.91015625, "learning_rate": 0.00017195, "loss": 0.922, "step": 3440 }, { "contrastive_loss": 4.053466796875, "epoch": 0.4078245406046236, "mse_loss": 0.1134205013513565, "step": 3440 }, { "epoch": 0.4090100770598696, "grad_norm": 0.64453125, "learning_rate": 0.00017245, "loss": 0.9156, "step": 3450 }, { "contrastive_loss": 4.0853271484375, "epoch": 0.4090100770598696, "mse_loss": 0.10865376889705658, "step": 3450 }, { "epoch": 0.4101956135151156, "grad_norm": 1.1796875, "learning_rate": 0.00017295, "loss": 0.9351, "step": 3460 }, { "contrastive_loss": 4.1336669921875, "epoch": 0.4101956135151156, "mse_loss": 0.08827009052038193, "step": 3460 }, { "epoch": 0.41138114997036157, "grad_norm": 0.73046875, "learning_rate": 0.00017345000000000001, "loss": 0.9125, "step": 3470 }, { "contrastive_loss": 4.027099609375, "epoch": 0.41138114997036157, "mse_loss": 0.0930965319275856, "step": 3470 }, { "epoch": 0.41256668642560756, "grad_norm": 0.6640625, "learning_rate": 0.00017395, "loss": 0.9256, "step": 3480 }, { "contrastive_loss": 3.98486328125, "epoch": 0.41256668642560756, "mse_loss": 0.09234724938869476, "step": 3480 }, { "epoch": 0.41375222288085356, "grad_norm": 0.68359375, "learning_rate": 0.00017445, "loss": 0.9272, "step": 3490 }, { "contrastive_loss": 4.1212158203125, "epoch": 0.41375222288085356, "mse_loss": 0.12837612628936768, "step": 3490 }, { "epoch": 0.4149377593360996, "grad_norm": 0.65625, "learning_rate": 0.00017495000000000002, "loss": 0.9307, "step": 3500 }, { "contrastive_loss": 4.009521484375, "epoch": 0.4149377593360996, "mse_loss": 0.10299235582351685, "step": 3500 }, { "epoch": 0.4161232957913456, "grad_norm": 0.6796875, "learning_rate": 0.00017545, "loss": 0.9218, "step": 3510 }, { "contrastive_loss": 4.1370849609375, "epoch": 0.4161232957913456, "mse_loss": 0.09344633668661118, "step": 3510 }, { "epoch": 0.4173088322465916, "grad_norm": 0.9609375, "learning_rate": 0.00017595000000000002, "loss": 0.922, "step": 3520 }, { "contrastive_loss": 4.103515625, "epoch": 0.4173088322465916, "mse_loss": 0.08716046065092087, "step": 3520 }, { "epoch": 0.4184943687018376, "grad_norm": 0.64453125, "learning_rate": 0.00017645, "loss": 0.9121, "step": 3530 }, { "contrastive_loss": 4.0733642578125, "epoch": 0.4184943687018376, "mse_loss": 0.09999170154333115, "step": 3530 }, { "epoch": 0.4196799051570836, "grad_norm": 0.68359375, "learning_rate": 0.00017695000000000002, "loss": 0.9263, "step": 3540 }, { "contrastive_loss": 4.138427734375, "epoch": 0.4196799051570836, "mse_loss": 0.11369039118289948, "step": 3540 }, { "epoch": 0.4208654416123296, "grad_norm": 0.55078125, "learning_rate": 0.00017745, "loss": 0.9157, "step": 3550 }, { "contrastive_loss": 4.1014404296875, "epoch": 0.4208654416123296, "mse_loss": 0.08885008096694946, "step": 3550 }, { "epoch": 0.4220509780675756, "grad_norm": 0.66015625, "learning_rate": 0.00017795000000000002, "loss": 0.921, "step": 3560 }, { "contrastive_loss": 4.0772705078125, "epoch": 0.4220509780675756, "mse_loss": 0.09464459121227264, "step": 3560 }, { "epoch": 0.42323651452282157, "grad_norm": 0.60546875, "learning_rate": 0.00017845, "loss": 0.9227, "step": 3570 }, { "contrastive_loss": 4.0074462890625, "epoch": 0.42323651452282157, "mse_loss": 0.07355610281229019, "step": 3570 }, { "epoch": 0.42442205097806757, "grad_norm": 0.6640625, "learning_rate": 0.00017895, "loss": 0.9094, "step": 3580 }, { "contrastive_loss": 3.980224609375, "epoch": 0.42442205097806757, "mse_loss": 0.12115359306335449, "step": 3580 }, { "epoch": 0.42560758743331356, "grad_norm": 0.62890625, "learning_rate": 0.00017945, "loss": 0.9021, "step": 3590 }, { "contrastive_loss": 4.1336669921875, "epoch": 0.42560758743331356, "mse_loss": 0.10456090420484543, "step": 3590 }, { "epoch": 0.42679312388855956, "grad_norm": 0.6328125, "learning_rate": 0.00017995, "loss": 0.907, "step": 3600 }, { "contrastive_loss": 4.1036376953125, "epoch": 0.42679312388855956, "mse_loss": 0.11601150780916214, "step": 3600 }, { "epoch": 0.42797866034380555, "grad_norm": 0.68359375, "learning_rate": 0.00018045, "loss": 0.916, "step": 3610 }, { "contrastive_loss": 4.1512451171875, "epoch": 0.42797866034380555, "mse_loss": 0.1271096020936966, "step": 3610 }, { "epoch": 0.42916419679905154, "grad_norm": 0.5234375, "learning_rate": 0.00018095, "loss": 0.9198, "step": 3620 }, { "contrastive_loss": 3.966064453125, "epoch": 0.42916419679905154, "mse_loss": 0.08115018904209137, "step": 3620 }, { "epoch": 0.4303497332542976, "grad_norm": 0.69140625, "learning_rate": 0.00018145000000000002, "loss": 0.9093, "step": 3630 }, { "contrastive_loss": 4.0655517578125, "epoch": 0.4303497332542976, "mse_loss": 0.13070158660411835, "step": 3630 }, { "epoch": 0.4315352697095436, "grad_norm": 0.66796875, "learning_rate": 0.00018195, "loss": 0.9086, "step": 3640 }, { "contrastive_loss": 4.121337890625, "epoch": 0.4315352697095436, "mse_loss": 0.07938522845506668, "step": 3640 }, { "epoch": 0.4327208061647896, "grad_norm": 0.65234375, "learning_rate": 0.00018245000000000002, "loss": 0.9178, "step": 3650 }, { "contrastive_loss": 4.1055908203125, "epoch": 0.4327208061647896, "mse_loss": 0.08913081139326096, "step": 3650 }, { "epoch": 0.4339063426200356, "grad_norm": 0.6796875, "learning_rate": 0.00018295, "loss": 0.9114, "step": 3660 }, { "contrastive_loss": 4.1387939453125, "epoch": 0.4339063426200356, "mse_loss": 0.09058559685945511, "step": 3660 }, { "epoch": 0.4350918790752816, "grad_norm": 0.51171875, "learning_rate": 0.00018345000000000001, "loss": 0.9118, "step": 3670 }, { "contrastive_loss": 3.985595703125, "epoch": 0.4350918790752816, "mse_loss": 0.09122901409864426, "step": 3670 }, { "epoch": 0.43627741553052757, "grad_norm": 0.78515625, "learning_rate": 0.00018395, "loss": 0.9169, "step": 3680 }, { "contrastive_loss": 4.0665283203125, "epoch": 0.43627741553052757, "mse_loss": 0.08188308775424957, "step": 3680 }, { "epoch": 0.43746295198577356, "grad_norm": 0.62890625, "learning_rate": 0.00018445, "loss": 0.9009, "step": 3690 }, { "contrastive_loss": 3.949951171875, "epoch": 0.43746295198577356, "mse_loss": 0.08264068514108658, "step": 3690 }, { "epoch": 0.43864848844101956, "grad_norm": 0.6484375, "learning_rate": 0.00018495, "loss": 0.8992, "step": 3700 }, { "contrastive_loss": 4.2147216796875, "epoch": 0.43864848844101956, "mse_loss": 0.10541795194149017, "step": 3700 }, { "epoch": 0.43983402489626555, "grad_norm": 0.6015625, "learning_rate": 0.00018545, "loss": 0.9233, "step": 3710 }, { "contrastive_loss": 4.128662109375, "epoch": 0.43983402489626555, "mse_loss": 0.07146850973367691, "step": 3710 }, { "epoch": 0.44101956135151155, "grad_norm": 1.046875, "learning_rate": 0.00018595, "loss": 0.911, "step": 3720 }, { "contrastive_loss": 4.1314697265625, "epoch": 0.44101956135151155, "mse_loss": 0.09614330530166626, "step": 3720 }, { "epoch": 0.44220509780675754, "grad_norm": 0.84375, "learning_rate": 0.00018645, "loss": 0.9084, "step": 3730 }, { "contrastive_loss": 4.0745849609375, "epoch": 0.44220509780675754, "mse_loss": 0.09659433364868164, "step": 3730 }, { "epoch": 0.44339063426200354, "grad_norm": 0.57421875, "learning_rate": 0.00018695, "loss": 0.9102, "step": 3740 }, { "contrastive_loss": 4.0584716796875, "epoch": 0.44339063426200354, "mse_loss": 0.05290510132908821, "step": 3740 }, { "epoch": 0.44457617071724953, "grad_norm": 0.5234375, "learning_rate": 0.00018745, "loss": 0.9067, "step": 3750 }, { "contrastive_loss": 4.13330078125, "epoch": 0.44457617071724953, "mse_loss": 0.06921229511499405, "step": 3750 }, { "epoch": 0.4457617071724956, "grad_norm": 0.66796875, "learning_rate": 0.00018795000000000001, "loss": 0.9107, "step": 3760 }, { "contrastive_loss": 4.141357421875, "epoch": 0.4457617071724956, "mse_loss": 0.09428645670413971, "step": 3760 }, { "epoch": 0.4469472436277416, "grad_norm": 0.78515625, "learning_rate": 0.00018845000000000003, "loss": 0.9245, "step": 3770 }, { "contrastive_loss": 3.8729248046875, "epoch": 0.4469472436277416, "mse_loss": 0.08555315434932709, "step": 3770 }, { "epoch": 0.44813278008298757, "grad_norm": 0.67578125, "learning_rate": 0.00018895, "loss": 0.9121, "step": 3780 }, { "contrastive_loss": 3.906982421875, "epoch": 0.44813278008298757, "mse_loss": 0.11373864114284515, "step": 3780 }, { "epoch": 0.44931831653823356, "grad_norm": 0.5703125, "learning_rate": 0.00018945000000000002, "loss": 0.8962, "step": 3790 }, { "contrastive_loss": 3.8436279296875, "epoch": 0.44931831653823356, "mse_loss": 0.10383045673370361, "step": 3790 }, { "epoch": 0.45050385299347956, "grad_norm": 0.87109375, "learning_rate": 0.00018995, "loss": 0.8974, "step": 3800 }, { "contrastive_loss": 4.0843505859375, "epoch": 0.45050385299347956, "mse_loss": 0.11736612766981125, "step": 3800 }, { "epoch": 0.45168938944872555, "grad_norm": 0.51171875, "learning_rate": 0.00019045000000000002, "loss": 0.8988, "step": 3810 }, { "contrastive_loss": 4.093505859375, "epoch": 0.45168938944872555, "mse_loss": 0.09193883836269379, "step": 3810 }, { "epoch": 0.45287492590397155, "grad_norm": 0.6015625, "learning_rate": 0.00019095, "loss": 0.9099, "step": 3820 }, { "contrastive_loss": 4.14697265625, "epoch": 0.45287492590397155, "mse_loss": 0.12842117249965668, "step": 3820 }, { "epoch": 0.45406046235921754, "grad_norm": 0.5390625, "learning_rate": 0.00019145000000000002, "loss": 0.9102, "step": 3830 }, { "contrastive_loss": 4.2430419921875, "epoch": 0.45406046235921754, "mse_loss": 0.08002772182226181, "step": 3830 }, { "epoch": 0.45524599881446354, "grad_norm": 0.58984375, "learning_rate": 0.00019195, "loss": 0.9165, "step": 3840 }, { "contrastive_loss": 4.0751953125, "epoch": 0.45524599881446354, "mse_loss": 0.11845382302999496, "step": 3840 }, { "epoch": 0.45643153526970953, "grad_norm": 0.5625, "learning_rate": 0.00019245000000000002, "loss": 0.9095, "step": 3850 }, { "contrastive_loss": 4.148193359375, "epoch": 0.45643153526970953, "mse_loss": 0.08966878801584244, "step": 3850 }, { "epoch": 0.4576170717249555, "grad_norm": 0.84765625, "learning_rate": 0.00019295, "loss": 0.9318, "step": 3860 }, { "contrastive_loss": 3.9681396484375, "epoch": 0.4576170717249555, "mse_loss": 0.1307077556848526, "step": 3860 }, { "epoch": 0.4588026081802015, "grad_norm": 0.75390625, "learning_rate": 0.00019345, "loss": 0.9142, "step": 3870 }, { "contrastive_loss": 4.1676025390625, "epoch": 0.4588026081802015, "mse_loss": 0.10310184955596924, "step": 3870 }, { "epoch": 0.4599881446354475, "grad_norm": 0.65625, "learning_rate": 0.00019395, "loss": 0.9011, "step": 3880 }, { "contrastive_loss": 3.958984375, "epoch": 0.4599881446354475, "mse_loss": 0.10802613198757172, "step": 3880 }, { "epoch": 0.46117368109069357, "grad_norm": 0.73828125, "learning_rate": 0.00019445, "loss": 0.9091, "step": 3890 }, { "contrastive_loss": 4.119873046875, "epoch": 0.46117368109069357, "mse_loss": 0.11622931063175201, "step": 3890 }, { "epoch": 0.46235921754593956, "grad_norm": 0.64453125, "learning_rate": 0.00019495000000000002, "loss": 0.9154, "step": 3900 }, { "contrastive_loss": 4.0643310546875, "epoch": 0.46235921754593956, "mse_loss": 0.10533808916807175, "step": 3900 }, { "epoch": 0.46354475400118555, "grad_norm": 0.69140625, "learning_rate": 0.00019545, "loss": 0.9056, "step": 3910 }, { "contrastive_loss": 4.075927734375, "epoch": 0.46354475400118555, "mse_loss": 0.09508102387189865, "step": 3910 }, { "epoch": 0.46473029045643155, "grad_norm": 1.0234375, "learning_rate": 0.00019595000000000002, "loss": 0.9059, "step": 3920 }, { "contrastive_loss": 4.218505859375, "epoch": 0.46473029045643155, "mse_loss": 0.1034964844584465, "step": 3920 }, { "epoch": 0.46591582691167754, "grad_norm": 0.6015625, "learning_rate": 0.00019645, "loss": 0.9226, "step": 3930 }, { "contrastive_loss": 4.0450439453125, "epoch": 0.46591582691167754, "mse_loss": 0.11729500442743301, "step": 3930 }, { "epoch": 0.46710136336692354, "grad_norm": 0.5859375, "learning_rate": 0.00019695000000000002, "loss": 0.9132, "step": 3940 }, { "contrastive_loss": 3.990966796875, "epoch": 0.46710136336692354, "mse_loss": 0.07509580999612808, "step": 3940 }, { "epoch": 0.46828689982216953, "grad_norm": 0.58203125, "learning_rate": 0.00019745, "loss": 0.9196, "step": 3950 }, { "contrastive_loss": 4.053955078125, "epoch": 0.46828689982216953, "mse_loss": 0.10210777819156647, "step": 3950 }, { "epoch": 0.46947243627741553, "grad_norm": 0.69140625, "learning_rate": 0.00019795000000000001, "loss": 0.8999, "step": 3960 }, { "contrastive_loss": 4.1002197265625, "epoch": 0.46947243627741553, "mse_loss": 0.10443031042814255, "step": 3960 }, { "epoch": 0.4706579727326615, "grad_norm": 0.78125, "learning_rate": 0.00019845, "loss": 0.9258, "step": 3970 }, { "contrastive_loss": 4.075927734375, "epoch": 0.4706579727326615, "mse_loss": 0.10543893277645111, "step": 3970 }, { "epoch": 0.4718435091879075, "grad_norm": 0.671875, "learning_rate": 0.00019895, "loss": 0.9164, "step": 3980 }, { "contrastive_loss": 4.1484375, "epoch": 0.4718435091879075, "mse_loss": 0.08579752594232559, "step": 3980 }, { "epoch": 0.4730290456431535, "grad_norm": 0.486328125, "learning_rate": 0.00019945, "loss": 0.9074, "step": 3990 }, { "contrastive_loss": 4.0001220703125, "epoch": 0.4730290456431535, "mse_loss": 0.10203082114458084, "step": 3990 }, { "epoch": 0.4742145820983995, "grad_norm": 0.59375, "learning_rate": 0.00019995, "loss": 0.9044, "step": 4000 }, { "contrastive_loss": 4.133544921875, "epoch": 0.4742145820983995, "mse_loss": 0.09986621141433716, "step": 4000 }, { "epoch": 0.4754001185536455, "grad_norm": 0.6484375, "learning_rate": 0.00019999999307965767, "loss": 0.9105, "step": 4010 }, { "contrastive_loss": 3.99658203125, "epoch": 0.4754001185536455, "mse_loss": 0.07952926307916641, "step": 4010 }, { "epoch": 0.47658565500889155, "grad_norm": 0.73828125, "learning_rate": 0.00019999996915748784, "loss": 0.9044, "step": 4020 }, { "contrastive_loss": 3.9595947265625, "epoch": 0.47658565500889155, "mse_loss": 0.09841399639844894, "step": 4020 }, { "epoch": 0.47777119146413755, "grad_norm": 0.5078125, "learning_rate": 0.00019999992814805827, "loss": 0.9162, "step": 4030 }, { "contrastive_loss": 4.052734375, "epoch": 0.47777119146413755, "mse_loss": 0.08763588964939117, "step": 4030 }, { "epoch": 0.47895672791938354, "grad_norm": 0.7734375, "learning_rate": 0.00019999987005137602, "loss": 0.9277, "step": 4040 }, { "contrastive_loss": 4.06689453125, "epoch": 0.47895672791938354, "mse_loss": 0.08135721832513809, "step": 4040 }, { "epoch": 0.48014226437462953, "grad_norm": 0.7734375, "learning_rate": 0.00019999979486745096, "loss": 0.8884, "step": 4050 }, { "contrastive_loss": 4.062744140625, "epoch": 0.48014226437462953, "mse_loss": 0.12895408272743225, "step": 4050 }, { "epoch": 0.48132780082987553, "grad_norm": 0.71484375, "learning_rate": 0.00019999970259629597, "loss": 0.9104, "step": 4060 }, { "contrastive_loss": 4.0755615234375, "epoch": 0.48132780082987553, "mse_loss": 0.09513301402330399, "step": 4060 }, { "epoch": 0.4825133372851215, "grad_norm": 0.5859375, "learning_rate": 0.0001999995932379268, "loss": 0.909, "step": 4070 }, { "contrastive_loss": 3.9466552734375, "epoch": 0.4825133372851215, "mse_loss": 0.07442797720432281, "step": 4070 }, { "epoch": 0.4836988737403675, "grad_norm": 0.6953125, "learning_rate": 0.00019999946679236214, "loss": 0.8931, "step": 4080 }, { "contrastive_loss": 3.956787109375, "epoch": 0.4836988737403675, "mse_loss": 0.12401874363422394, "step": 4080 }, { "epoch": 0.4848844101956135, "grad_norm": 0.734375, "learning_rate": 0.00019999932325962357, "loss": 0.8987, "step": 4090 }, { "contrastive_loss": 4.0406494140625, "epoch": 0.4848844101956135, "mse_loss": 0.08016599714756012, "step": 4090 }, { "epoch": 0.4860699466508595, "grad_norm": 0.55078125, "learning_rate": 0.00019999916263973568, "loss": 0.8972, "step": 4100 }, { "contrastive_loss": 4.130126953125, "epoch": 0.4860699466508595, "mse_loss": 0.1163664236664772, "step": 4100 }, { "epoch": 0.4872554831061055, "grad_norm": 0.58984375, "learning_rate": 0.00019999898493272585, "loss": 0.9015, "step": 4110 }, { "contrastive_loss": 4.0999755859375, "epoch": 0.4872554831061055, "mse_loss": 0.0965876579284668, "step": 4110 }, { "epoch": 0.4884410195613515, "grad_norm": 0.61328125, "learning_rate": 0.00019999879013862448, "loss": 0.9059, "step": 4120 }, { "contrastive_loss": 3.991455078125, "epoch": 0.4884410195613515, "mse_loss": 0.0675886794924736, "step": 4120 }, { "epoch": 0.4896265560165975, "grad_norm": 0.59375, "learning_rate": 0.00019999857825746487, "loss": 0.9091, "step": 4130 }, { "contrastive_loss": 4.042236328125, "epoch": 0.4896265560165975, "mse_loss": 0.10280900448560715, "step": 4130 }, { "epoch": 0.4908120924718435, "grad_norm": 0.5703125, "learning_rate": 0.00019999834928928318, "loss": 0.9122, "step": 4140 }, { "contrastive_loss": 3.99072265625, "epoch": 0.4908120924718435, "mse_loss": 0.1214645728468895, "step": 4140 }, { "epoch": 0.4919976289270895, "grad_norm": 0.671875, "learning_rate": 0.00019999810323411858, "loss": 0.9065, "step": 4150 }, { "contrastive_loss": 4.086181640625, "epoch": 0.4919976289270895, "mse_loss": 0.06178551912307739, "step": 4150 }, { "epoch": 0.49318316538233553, "grad_norm": 0.5859375, "learning_rate": 0.00019999784009201306, "loss": 0.9009, "step": 4160 }, { "contrastive_loss": 4.0809326171875, "epoch": 0.49318316538233553, "mse_loss": 0.1264384537935257, "step": 4160 }, { "epoch": 0.4943687018375815, "grad_norm": 0.51171875, "learning_rate": 0.00019999755986301163, "loss": 0.9098, "step": 4170 }, { "contrastive_loss": 4.1707763671875, "epoch": 0.4943687018375815, "mse_loss": 0.09478934854269028, "step": 4170 }, { "epoch": 0.4955542382928275, "grad_norm": 0.62109375, "learning_rate": 0.00019999726254716217, "loss": 0.9046, "step": 4180 }, { "contrastive_loss": 4.034912109375, "epoch": 0.4955542382928275, "mse_loss": 0.09427099674940109, "step": 4180 }, { "epoch": 0.4967397747480735, "grad_norm": 0.48046875, "learning_rate": 0.00019999694814451546, "loss": 0.9044, "step": 4190 }, { "contrastive_loss": 4.1546630859375, "epoch": 0.4967397747480735, "mse_loss": 0.08956383913755417, "step": 4190 }, { "epoch": 0.4979253112033195, "grad_norm": 0.64453125, "learning_rate": 0.00019999661665512524, "loss": 0.9066, "step": 4200 }, { "contrastive_loss": 4.1539306640625, "epoch": 0.4979253112033195, "mse_loss": 0.08178234100341797, "step": 4200 }, { "epoch": 0.4991108476585655, "grad_norm": 0.59375, "learning_rate": 0.00019999626807904814, "loss": 0.9019, "step": 4210 }, { "contrastive_loss": 4.1136474609375, "epoch": 0.4991108476585655, "mse_loss": 0.07516860961914062, "step": 4210 }, { "epoch": 0.5002963841138115, "grad_norm": 0.59375, "learning_rate": 0.00019999590241634373, "loss": 0.8983, "step": 4220 }, { "contrastive_loss": 3.974609375, "epoch": 0.5002963841138115, "mse_loss": 0.10501842200756073, "step": 4220 }, { "epoch": 0.5014819205690575, "grad_norm": 0.5703125, "learning_rate": 0.0001999955196670745, "loss": 0.8967, "step": 4230 }, { "contrastive_loss": 4.156005859375, "epoch": 0.5014819205690575, "mse_loss": 0.08760775625705719, "step": 4230 }, { "epoch": 0.5026674570243035, "grad_norm": 0.515625, "learning_rate": 0.00019999511983130583, "loss": 0.9102, "step": 4240 }, { "contrastive_loss": 4.06298828125, "epoch": 0.5026674570243035, "mse_loss": 0.07732134312391281, "step": 4240 }, { "epoch": 0.5038529934795495, "grad_norm": 0.474609375, "learning_rate": 0.00019999470290910605, "loss": 0.9094, "step": 4250 }, { "contrastive_loss": 4.0496826171875, "epoch": 0.5038529934795495, "mse_loss": 0.08357816189527512, "step": 4250 }, { "epoch": 0.5050385299347955, "grad_norm": 0.60546875, "learning_rate": 0.0001999942689005464, "loss": 0.9023, "step": 4260 }, { "contrastive_loss": 3.9691162109375, "epoch": 0.5050385299347955, "mse_loss": 0.08907872438430786, "step": 4260 }, { "epoch": 0.5062240663900415, "grad_norm": 0.7265625, "learning_rate": 0.00019999381780570107, "loss": 0.9056, "step": 4270 }, { "contrastive_loss": 3.9488525390625, "epoch": 0.5062240663900415, "mse_loss": 0.08910180628299713, "step": 4270 }, { "epoch": 0.5074096028452875, "grad_norm": 0.640625, "learning_rate": 0.0001999933496246471, "loss": 0.8915, "step": 4280 }, { "contrastive_loss": 4.19482421875, "epoch": 0.5074096028452875, "mse_loss": 0.08402635157108307, "step": 4280 }, { "epoch": 0.5085951393005335, "grad_norm": 0.51953125, "learning_rate": 0.0001999928643574645, "loss": 0.8981, "step": 4290 }, { "contrastive_loss": 4.033203125, "epoch": 0.5085951393005335, "mse_loss": 0.16273391246795654, "step": 4290 }, { "epoch": 0.5097806757557795, "grad_norm": 0.60546875, "learning_rate": 0.00019999236200423618, "loss": 0.9084, "step": 4300 }, { "contrastive_loss": 3.993896484375, "epoch": 0.5097806757557795, "mse_loss": 0.07304084300994873, "step": 4300 }, { "epoch": 0.5109662122110255, "grad_norm": 0.52734375, "learning_rate": 0.00019999184256504804, "loss": 0.8927, "step": 4310 }, { "contrastive_loss": 4.007080078125, "epoch": 0.5109662122110255, "mse_loss": 0.11508337408304214, "step": 4310 }, { "epoch": 0.5121517486662714, "grad_norm": 0.6328125, "learning_rate": 0.00019999130603998874, "loss": 0.8942, "step": 4320 }, { "contrastive_loss": 3.95654296875, "epoch": 0.5121517486662714, "mse_loss": 0.10657723993062973, "step": 4320 }, { "epoch": 0.5133372851215174, "grad_norm": 0.69921875, "learning_rate": 0.00019999075242915003, "loss": 0.8991, "step": 4330 }, { "contrastive_loss": 4.066162109375, "epoch": 0.5133372851215174, "mse_loss": 0.08128596842288971, "step": 4330 }, { "epoch": 0.5145228215767634, "grad_norm": 0.61328125, "learning_rate": 0.00019999018173262647, "loss": 0.8985, "step": 4340 }, { "contrastive_loss": 4.1102294921875, "epoch": 0.5145228215767634, "mse_loss": 0.08420556038618088, "step": 4340 }, { "epoch": 0.5157083580320095, "grad_norm": 0.69921875, "learning_rate": 0.0001999895939505156, "loss": 0.9109, "step": 4350 }, { "contrastive_loss": 4.07861328125, "epoch": 0.5157083580320095, "mse_loss": 0.09366200864315033, "step": 4350 }, { "epoch": 0.5168938944872555, "grad_norm": 0.61328125, "learning_rate": 0.00019998898908291782, "loss": 0.909, "step": 4360 }, { "contrastive_loss": 4.0245361328125, "epoch": 0.5168938944872555, "mse_loss": 0.10329040139913559, "step": 4360 }, { "epoch": 0.5180794309425015, "grad_norm": 0.59375, "learning_rate": 0.00019998836712993654, "loss": 0.8976, "step": 4370 }, { "contrastive_loss": 4.0181884765625, "epoch": 0.5180794309425015, "mse_loss": 0.06395865231752396, "step": 4370 }, { "epoch": 0.5192649673977475, "grad_norm": 0.431640625, "learning_rate": 0.00019998772809167798, "loss": 0.8948, "step": 4380 }, { "contrastive_loss": 3.875, "epoch": 0.5192649673977475, "mse_loss": 0.08682440966367722, "step": 4380 }, { "epoch": 0.5204505038529935, "grad_norm": 0.609375, "learning_rate": 0.00019998707196825137, "loss": 0.8895, "step": 4390 }, { "contrastive_loss": 4.2178955078125, "epoch": 0.5204505038529935, "mse_loss": 0.10673367977142334, "step": 4390 }, { "epoch": 0.5216360403082395, "grad_norm": 0.58984375, "learning_rate": 0.00019998639875976884, "loss": 0.9249, "step": 4400 }, { "contrastive_loss": 4.0283203125, "epoch": 0.5216360403082395, "mse_loss": 0.10114451497793198, "step": 4400 }, { "epoch": 0.5228215767634855, "grad_norm": 0.52734375, "learning_rate": 0.00019998570846634537, "loss": 0.9052, "step": 4410 }, { "contrastive_loss": 3.9234619140625, "epoch": 0.5228215767634855, "mse_loss": 0.08521365374326706, "step": 4410 }, { "epoch": 0.5240071132187315, "grad_norm": 0.5546875, "learning_rate": 0.00019998500108809895, "loss": 0.8984, "step": 4420 }, { "contrastive_loss": 4.0692138671875, "epoch": 0.5240071132187315, "mse_loss": 0.10638834536075592, "step": 4420 }, { "epoch": 0.5251926496739775, "grad_norm": 0.56640625, "learning_rate": 0.0001999842766251504, "loss": 0.9036, "step": 4430 }, { "contrastive_loss": 3.9476318359375, "epoch": 0.5251926496739775, "mse_loss": 0.08467444032430649, "step": 4430 }, { "epoch": 0.5263781861292235, "grad_norm": 0.73046875, "learning_rate": 0.0001999835350776236, "loss": 0.896, "step": 4440 }, { "contrastive_loss": 4.0821533203125, "epoch": 0.5263781861292235, "mse_loss": 0.06903039664030075, "step": 4440 }, { "epoch": 0.5275637225844695, "grad_norm": 0.6875, "learning_rate": 0.0001999827764456452, "loss": 0.894, "step": 4450 }, { "contrastive_loss": 4.0037841796875, "epoch": 0.5275637225844695, "mse_loss": 0.09038983285427094, "step": 4450 }, { "epoch": 0.5287492590397155, "grad_norm": 0.75390625, "learning_rate": 0.00019998200072934483, "loss": 0.9051, "step": 4460 }, { "contrastive_loss": 4.0372314453125, "epoch": 0.5287492590397155, "mse_loss": 0.0979473665356636, "step": 4460 }, { "epoch": 0.5299347954949615, "grad_norm": 0.67578125, "learning_rate": 0.00019998120792885505, "loss": 0.9002, "step": 4470 }, { "contrastive_loss": 3.9666748046875, "epoch": 0.5299347954949615, "mse_loss": 0.06993796676397324, "step": 4470 }, { "epoch": 0.5311203319502075, "grad_norm": 0.51171875, "learning_rate": 0.00019998039804431132, "loss": 0.9024, "step": 4480 }, { "contrastive_loss": 4.0203857421875, "epoch": 0.5311203319502075, "mse_loss": 0.10714704543352127, "step": 4480 }, { "epoch": 0.5323058684054535, "grad_norm": 0.8515625, "learning_rate": 0.00019997957107585203, "loss": 0.904, "step": 4490 }, { "contrastive_loss": 3.97900390625, "epoch": 0.5323058684054535, "mse_loss": 0.05539511516690254, "step": 4490 }, { "epoch": 0.5334914048606995, "grad_norm": 0.57421875, "learning_rate": 0.00019997872702361851, "loss": 0.8843, "step": 4500 }, { "contrastive_loss": 4.030029296875, "epoch": 0.5334914048606995, "mse_loss": 0.10205431282520294, "step": 4500 }, { "epoch": 0.5346769413159455, "grad_norm": 0.484375, "learning_rate": 0.00019997786588775494, "loss": 0.9203, "step": 4510 }, { "contrastive_loss": 4.10595703125, "epoch": 0.5346769413159455, "mse_loss": 0.07843028008937836, "step": 4510 }, { "epoch": 0.5358624777711914, "grad_norm": 0.490234375, "learning_rate": 0.00019997698766840852, "loss": 0.9073, "step": 4520 }, { "contrastive_loss": 3.984130859375, "epoch": 0.5358624777711914, "mse_loss": 0.1173563003540039, "step": 4520 }, { "epoch": 0.5370480142264374, "grad_norm": 0.61328125, "learning_rate": 0.0001999760923657293, "loss": 0.8973, "step": 4530 }, { "contrastive_loss": 4.112548828125, "epoch": 0.5370480142264374, "mse_loss": 0.10803462564945221, "step": 4530 }, { "epoch": 0.5382335506816834, "grad_norm": 0.54296875, "learning_rate": 0.0001999751799798702, "loss": 0.8912, "step": 4540 }, { "contrastive_loss": 4.03857421875, "epoch": 0.5382335506816834, "mse_loss": 0.08935708552598953, "step": 4540 }, { "epoch": 0.5394190871369294, "grad_norm": 0.474609375, "learning_rate": 0.0001999742505109872, "loss": 0.8878, "step": 4550 }, { "contrastive_loss": 4.15380859375, "epoch": 0.5394190871369294, "mse_loss": 0.092686228454113, "step": 4550 }, { "epoch": 0.5406046235921754, "grad_norm": 0.515625, "learning_rate": 0.0001999733039592391, "loss": 0.8958, "step": 4560 }, { "contrastive_loss": 4.231201171875, "epoch": 0.5406046235921754, "mse_loss": 0.10412076860666275, "step": 4560 }, { "epoch": 0.5417901600474214, "grad_norm": 0.412109375, "learning_rate": 0.00019997234032478759, "loss": 0.8964, "step": 4570 }, { "contrastive_loss": 3.9122314453125, "epoch": 0.5417901600474214, "mse_loss": 0.09769036620855331, "step": 4570 }, { "epoch": 0.5429756965026674, "grad_norm": 0.625, "learning_rate": 0.00019997135960779738, "loss": 0.8902, "step": 4580 }, { "contrastive_loss": 4.092041015625, "epoch": 0.5429756965026674, "mse_loss": 0.10547403246164322, "step": 4580 }, { "epoch": 0.5441612329579134, "grad_norm": 0.46875, "learning_rate": 0.00019997036180843605, "loss": 0.9011, "step": 4590 }, { "contrastive_loss": 3.95654296875, "epoch": 0.5441612329579134, "mse_loss": 0.08604361116886139, "step": 4590 }, { "epoch": 0.5453467694131594, "grad_norm": 0.51171875, "learning_rate": 0.00019996934692687407, "loss": 0.8966, "step": 4600 }, { "contrastive_loss": 4.1468505859375, "epoch": 0.5453467694131594, "mse_loss": 0.09285395592451096, "step": 4600 }, { "epoch": 0.5465323058684054, "grad_norm": 0.6328125, "learning_rate": 0.00019996831496328486, "loss": 0.9006, "step": 4610 }, { "contrastive_loss": 3.9710693359375, "epoch": 0.5465323058684054, "mse_loss": 0.09043087810277939, "step": 4610 }, { "epoch": 0.5477178423236515, "grad_norm": 0.486328125, "learning_rate": 0.00019996726591784477, "loss": 0.8939, "step": 4620 }, { "contrastive_loss": 3.9859619140625, "epoch": 0.5477178423236515, "mse_loss": 0.062602698802948, "step": 4620 }, { "epoch": 0.5489033787788975, "grad_norm": 0.6015625, "learning_rate": 0.00019996619979073305, "loss": 0.8981, "step": 4630 }, { "contrastive_loss": 3.9801025390625, "epoch": 0.5489033787788975, "mse_loss": 0.09071660041809082, "step": 4630 }, { "epoch": 0.5500889152341435, "grad_norm": 0.58984375, "learning_rate": 0.00019996511658213186, "loss": 0.8963, "step": 4640 }, { "contrastive_loss": 3.923828125, "epoch": 0.5500889152341435, "mse_loss": 0.06724435836076736, "step": 4640 }, { "epoch": 0.5512744516893895, "grad_norm": 0.7109375, "learning_rate": 0.00019996401629222631, "loss": 0.8911, "step": 4650 }, { "contrastive_loss": 3.8138427734375, "epoch": 0.5512744516893895, "mse_loss": 0.08496362715959549, "step": 4650 }, { "epoch": 0.5524599881446355, "grad_norm": 0.6953125, "learning_rate": 0.00019996289892120438, "loss": 0.9026, "step": 4660 }, { "contrastive_loss": 3.905029296875, "epoch": 0.5524599881446355, "mse_loss": 0.0840877965092659, "step": 4660 }, { "epoch": 0.5536455245998815, "grad_norm": 0.62890625, "learning_rate": 0.00019996176446925704, "loss": 0.8775, "step": 4670 }, { "contrastive_loss": 4.0233154296875, "epoch": 0.5536455245998815, "mse_loss": 0.0892411321401596, "step": 4670 }, { "epoch": 0.5548310610551275, "grad_norm": 0.50390625, "learning_rate": 0.0001999606129365781, "loss": 0.8753, "step": 4680 }, { "contrastive_loss": 4.0809326171875, "epoch": 0.5548310610551275, "mse_loss": 0.10882217437028885, "step": 4680 }, { "epoch": 0.5560165975103735, "grad_norm": 0.73046875, "learning_rate": 0.00019995944432336433, "loss": 0.8995, "step": 4690 }, { "contrastive_loss": 3.9422607421875, "epoch": 0.5560165975103735, "mse_loss": 0.08080612123012543, "step": 4690 }, { "epoch": 0.5572021339656195, "grad_norm": 0.51953125, "learning_rate": 0.00019995825862981543, "loss": 0.8953, "step": 4700 }, { "contrastive_loss": 3.9869384765625, "epoch": 0.5572021339656195, "mse_loss": 0.12826408445835114, "step": 4700 }, { "epoch": 0.5583876704208655, "grad_norm": 0.43359375, "learning_rate": 0.000199957055856134, "loss": 0.8921, "step": 4710 }, { "contrastive_loss": 4.01611328125, "epoch": 0.5583876704208655, "mse_loss": 0.08900080621242523, "step": 4710 }, { "epoch": 0.5595732068761115, "grad_norm": 0.6484375, "learning_rate": 0.00019995583600252554, "loss": 0.8943, "step": 4720 }, { "contrastive_loss": 4.030029296875, "epoch": 0.5595732068761115, "mse_loss": 0.08232937753200531, "step": 4720 }, { "epoch": 0.5607587433313574, "grad_norm": 0.6484375, "learning_rate": 0.00019995459906919853, "loss": 0.8936, "step": 4730 }, { "contrastive_loss": 4.04736328125, "epoch": 0.5607587433313574, "mse_loss": 0.07257894426584244, "step": 4730 }, { "epoch": 0.5619442797866034, "grad_norm": 0.4921875, "learning_rate": 0.0001999533450563643, "loss": 0.8851, "step": 4740 }, { "contrastive_loss": 4.06201171875, "epoch": 0.5619442797866034, "mse_loss": 0.08597172051668167, "step": 4740 }, { "epoch": 0.5631298162418494, "grad_norm": 0.51171875, "learning_rate": 0.0001999520739642371, "loss": 0.9063, "step": 4750 }, { "contrastive_loss": 4.071044921875, "epoch": 0.5631298162418494, "mse_loss": 0.0934813991189003, "step": 4750 }, { "epoch": 0.5643153526970954, "grad_norm": 0.3984375, "learning_rate": 0.0001999507857930342, "loss": 0.8892, "step": 4760 }, { "contrastive_loss": 4.105224609375, "epoch": 0.5643153526970954, "mse_loss": 0.07303284853696823, "step": 4760 }, { "epoch": 0.5655008891523414, "grad_norm": 0.498046875, "learning_rate": 0.00019994948054297563, "loss": 0.8948, "step": 4770 }, { "contrastive_loss": 4.0087890625, "epoch": 0.5655008891523414, "mse_loss": 0.12382686883211136, "step": 4770 }, { "epoch": 0.5666864256075874, "grad_norm": 0.47265625, "learning_rate": 0.00019994815821428445, "loss": 0.902, "step": 4780 }, { "contrastive_loss": 4.061279296875, "epoch": 0.5666864256075874, "mse_loss": 0.11396132409572601, "step": 4780 }, { "epoch": 0.5678719620628334, "grad_norm": 0.50390625, "learning_rate": 0.00019994681880718663, "loss": 0.892, "step": 4790 }, { "contrastive_loss": 4.1346435546875, "epoch": 0.5678719620628334, "mse_loss": 0.07462068647146225, "step": 4790 }, { "epoch": 0.5690574985180794, "grad_norm": 0.51171875, "learning_rate": 0.00019994546232191104, "loss": 0.9032, "step": 4800 }, { "contrastive_loss": 4.070068359375, "epoch": 0.5690574985180794, "mse_loss": 0.0727568045258522, "step": 4800 }, { "epoch": 0.5702430349733254, "grad_norm": 0.875, "learning_rate": 0.00019994408875868947, "loss": 0.8934, "step": 4810 }, { "contrastive_loss": 4.117431640625, "epoch": 0.5702430349733254, "mse_loss": 0.1141321137547493, "step": 4810 }, { "epoch": 0.5714285714285714, "grad_norm": 0.625, "learning_rate": 0.00019994269811775657, "loss": 0.906, "step": 4820 }, { "contrastive_loss": 4.01513671875, "epoch": 0.5714285714285714, "mse_loss": 0.1008860245347023, "step": 4820 }, { "epoch": 0.5726141078838174, "grad_norm": 0.5234375, "learning_rate": 0.00019994129039935002, "loss": 0.8964, "step": 4830 }, { "contrastive_loss": 4.115966796875, "epoch": 0.5726141078838174, "mse_loss": 0.12503373622894287, "step": 4830 }, { "epoch": 0.5737996443390634, "grad_norm": 0.75, "learning_rate": 0.00019993986560371034, "loss": 0.9132, "step": 4840 }, { "contrastive_loss": 4.0711669921875, "epoch": 0.5737996443390634, "mse_loss": 0.09221605211496353, "step": 4840 }, { "epoch": 0.5749851807943094, "grad_norm": 0.58203125, "learning_rate": 0.000199938423731081, "loss": 0.9026, "step": 4850 }, { "contrastive_loss": 3.9638671875, "epoch": 0.5749851807943094, "mse_loss": 0.08438567817211151, "step": 4850 }, { "epoch": 0.5761707172495554, "grad_norm": 0.671875, "learning_rate": 0.00019993696478170833, "loss": 0.8993, "step": 4860 }, { "contrastive_loss": 4.0257568359375, "epoch": 0.5761707172495554, "mse_loss": 0.060534585267305374, "step": 4860 }, { "epoch": 0.5773562537048014, "grad_norm": 0.53125, "learning_rate": 0.0001999354887558417, "loss": 0.8832, "step": 4870 }, { "contrastive_loss": 4.08642578125, "epoch": 0.5773562537048014, "mse_loss": 0.0882234126329422, "step": 4870 }, { "epoch": 0.5785417901600475, "grad_norm": 0.58203125, "learning_rate": 0.00019993399565373327, "loss": 0.8912, "step": 4880 }, { "contrastive_loss": 4.0718994140625, "epoch": 0.5785417901600475, "mse_loss": 0.06884758174419403, "step": 4880 }, { "epoch": 0.5797273266152935, "grad_norm": 0.546875, "learning_rate": 0.00019993248547563817, "loss": 0.898, "step": 4890 }, { "contrastive_loss": 4.01513671875, "epoch": 0.5797273266152935, "mse_loss": 0.09094120562076569, "step": 4890 }, { "epoch": 0.5809128630705395, "grad_norm": 0.52734375, "learning_rate": 0.0001999309582218145, "loss": 0.8952, "step": 4900 }, { "contrastive_loss": 4.1275634765625, "epoch": 0.5809128630705395, "mse_loss": 0.10562551021575928, "step": 4900 }, { "epoch": 0.5820983995257855, "grad_norm": 0.5546875, "learning_rate": 0.00019992941389252315, "loss": 0.8837, "step": 4910 }, { "contrastive_loss": 3.971923828125, "epoch": 0.5820983995257855, "mse_loss": 0.08586413413286209, "step": 4910 }, { "epoch": 0.5832839359810315, "grad_norm": 0.61328125, "learning_rate": 0.00019992785248802806, "loss": 0.8907, "step": 4920 }, { "contrastive_loss": 3.9786376953125, "epoch": 0.5832839359810315, "mse_loss": 0.12609784305095673, "step": 4920 }, { "epoch": 0.5844694724362774, "grad_norm": 0.53515625, "learning_rate": 0.00019992627400859601, "loss": 0.8873, "step": 4930 }, { "contrastive_loss": 3.996826171875, "epoch": 0.5844694724362774, "mse_loss": 0.0708441287279129, "step": 4930 }, { "epoch": 0.5856550088915234, "grad_norm": 0.546875, "learning_rate": 0.00019992467845449672, "loss": 0.886, "step": 4940 }, { "contrastive_loss": 4.208251953125, "epoch": 0.5856550088915234, "mse_loss": 0.0696384459733963, "step": 4940 }, { "epoch": 0.5868405453467694, "grad_norm": 0.5234375, "learning_rate": 0.00019992306582600281, "loss": 0.9051, "step": 4950 }, { "contrastive_loss": 4.169921875, "epoch": 0.5868405453467694, "mse_loss": 0.08407063782215118, "step": 4950 }, { "epoch": 0.5880260818020154, "grad_norm": 0.515625, "learning_rate": 0.00019992143612338988, "loss": 0.8932, "step": 4960 }, { "contrastive_loss": 4.024658203125, "epoch": 0.5880260818020154, "mse_loss": 0.09194784611463547, "step": 4960 }, { "epoch": 0.5892116182572614, "grad_norm": 0.5390625, "learning_rate": 0.00019991978934693635, "loss": 0.9052, "step": 4970 }, { "contrastive_loss": 4.2420654296875, "epoch": 0.5892116182572614, "mse_loss": 0.06364916265010834, "step": 4970 }, { "epoch": 0.5903971547125074, "grad_norm": 0.796875, "learning_rate": 0.00019991812549692366, "loss": 0.8974, "step": 4980 }, { "contrastive_loss": 3.9775390625, "epoch": 0.5903971547125074, "mse_loss": 0.07183890789747238, "step": 4980 }, { "epoch": 0.5915826911677534, "grad_norm": 0.625, "learning_rate": 0.00019991644457363606, "loss": 0.8893, "step": 4990 }, { "contrastive_loss": 3.93359375, "epoch": 0.5915826911677534, "mse_loss": 0.08192384243011475, "step": 4990 }, { "epoch": 0.5927682276229994, "grad_norm": 0.447265625, "learning_rate": 0.0001999147465773608, "loss": 0.893, "step": 5000 }, { "contrastive_loss": 3.9586181640625, "epoch": 0.5927682276229994, "mse_loss": 0.10005556046962738, "step": 5000 }, { "epoch": 0.5939537640782454, "grad_norm": 0.5625, "learning_rate": 0.00019991303150838804, "loss": 0.8963, "step": 5010 }, { "contrastive_loss": 3.8736572265625, "epoch": 0.5939537640782454, "mse_loss": 0.05638090893626213, "step": 5010 }, { "epoch": 0.5951393005334914, "grad_norm": 0.56640625, "learning_rate": 0.00019991129936701083, "loss": 0.8892, "step": 5020 }, { "contrastive_loss": 4.0693359375, "epoch": 0.5951393005334914, "mse_loss": 0.0785897821187973, "step": 5020 }, { "epoch": 0.5963248369887374, "grad_norm": 0.73828125, "learning_rate": 0.00019990955015352513, "loss": 0.896, "step": 5030 }, { "contrastive_loss": 4.0440673828125, "epoch": 0.5963248369887374, "mse_loss": 0.09172405302524567, "step": 5030 }, { "epoch": 0.5975103734439834, "grad_norm": 0.451171875, "learning_rate": 0.00019990778386822986, "loss": 0.8864, "step": 5040 }, { "contrastive_loss": 4.000732421875, "epoch": 0.5975103734439834, "mse_loss": 0.09617932885885239, "step": 5040 }, { "epoch": 0.5986959098992294, "grad_norm": 0.55859375, "learning_rate": 0.00019990600051142678, "loss": 0.8899, "step": 5050 }, { "contrastive_loss": 3.9891357421875, "epoch": 0.5986959098992294, "mse_loss": 0.08430637419223785, "step": 5050 }, { "epoch": 0.5998814463544754, "grad_norm": 0.5703125, "learning_rate": 0.00019990420008342069, "loss": 0.8856, "step": 5060 }, { "contrastive_loss": 4.0181884765625, "epoch": 0.5998814463544754, "mse_loss": 0.08420503884553909, "step": 5060 }, { "epoch": 0.6010669828097214, "grad_norm": 0.66015625, "learning_rate": 0.00019990238258451912, "loss": 0.8865, "step": 5070 }, { "contrastive_loss": 4.123046875, "epoch": 0.6010669828097214, "mse_loss": 0.09524980932474136, "step": 5070 }, { "epoch": 0.6022525192649674, "grad_norm": 0.65234375, "learning_rate": 0.00019990054801503275, "loss": 0.884, "step": 5080 }, { "contrastive_loss": 3.919677734375, "epoch": 0.6022525192649674, "mse_loss": 0.053328268229961395, "step": 5080 }, { "epoch": 0.6034380557202134, "grad_norm": 0.671875, "learning_rate": 0.00019989869637527502, "loss": 0.8997, "step": 5090 }, { "contrastive_loss": 3.9515380859375, "epoch": 0.6034380557202134, "mse_loss": 0.0875898078083992, "step": 5090 }, { "epoch": 0.6046235921754594, "grad_norm": 0.478515625, "learning_rate": 0.0001998968276655623, "loss": 0.8915, "step": 5100 }, { "contrastive_loss": 4.1104736328125, "epoch": 0.6046235921754594, "mse_loss": 0.09458056837320328, "step": 5100 }, { "epoch": 0.6058091286307054, "grad_norm": 0.58984375, "learning_rate": 0.0001998949418862139, "loss": 0.8975, "step": 5110 }, { "contrastive_loss": 4.0225830078125, "epoch": 0.6058091286307054, "mse_loss": 0.12264806777238846, "step": 5110 }, { "epoch": 0.6069946650859513, "grad_norm": 0.609375, "learning_rate": 0.00019989303903755209, "loss": 0.9023, "step": 5120 }, { "contrastive_loss": 3.930908203125, "epoch": 0.6069946650859513, "mse_loss": 0.07088694721460342, "step": 5120 }, { "epoch": 0.6081802015411973, "grad_norm": 0.83203125, "learning_rate": 0.00019989111911990199, "loss": 0.8829, "step": 5130 }, { "contrastive_loss": 3.99853515625, "epoch": 0.6081802015411973, "mse_loss": 0.08572258055210114, "step": 5130 }, { "epoch": 0.6093657379964433, "grad_norm": 0.59765625, "learning_rate": 0.00019988918213359163, "loss": 0.9023, "step": 5140 }, { "contrastive_loss": 4.01806640625, "epoch": 0.6093657379964433, "mse_loss": 0.06641493737697601, "step": 5140 }, { "epoch": 0.6105512744516894, "grad_norm": 0.796875, "learning_rate": 0.00019988722807895207, "loss": 0.88, "step": 5150 }, { "contrastive_loss": 4.0697021484375, "epoch": 0.6105512744516894, "mse_loss": 0.07310134172439575, "step": 5150 }, { "epoch": 0.6117368109069354, "grad_norm": 0.7578125, "learning_rate": 0.00019988525695631708, "loss": 0.8995, "step": 5160 }, { "contrastive_loss": 3.9366455078125, "epoch": 0.6117368109069354, "mse_loss": 0.0682346373796463, "step": 5160 }, { "epoch": 0.6129223473621814, "grad_norm": 0.73828125, "learning_rate": 0.0001998832687660236, "loss": 0.8716, "step": 5170 }, { "contrastive_loss": 3.81884765625, "epoch": 0.6129223473621814, "mse_loss": 0.08023589104413986, "step": 5170 }, { "epoch": 0.6141078838174274, "grad_norm": 0.54296875, "learning_rate": 0.0001998812635084113, "loss": 0.8935, "step": 5180 }, { "contrastive_loss": 4.0706787109375, "epoch": 0.6141078838174274, "mse_loss": 0.07575637847185135, "step": 5180 }, { "epoch": 0.6152934202726734, "grad_norm": 0.50390625, "learning_rate": 0.0001998792411838228, "loss": 0.8998, "step": 5190 }, { "contrastive_loss": 3.8902587890625, "epoch": 0.6152934202726734, "mse_loss": 0.09060332924127579, "step": 5190 }, { "epoch": 0.6164789567279194, "grad_norm": 0.5, "learning_rate": 0.0001998772017926037, "loss": 0.8913, "step": 5200 }, { "contrastive_loss": 4.05078125, "epoch": 0.6164789567279194, "mse_loss": 0.09357309341430664, "step": 5200 }, { "epoch": 0.6176644931831654, "grad_norm": 0.48046875, "learning_rate": 0.00019987514533510245, "loss": 0.8847, "step": 5210 }, { "contrastive_loss": 4.0028076171875, "epoch": 0.6176644931831654, "mse_loss": 0.0995769053697586, "step": 5210 }, { "epoch": 0.6188500296384114, "grad_norm": 0.5, "learning_rate": 0.00019987307181167045, "loss": 0.8779, "step": 5220 }, { "contrastive_loss": 3.849609375, "epoch": 0.6188500296384114, "mse_loss": 0.0990225151181221, "step": 5220 }, { "epoch": 0.6200355660936574, "grad_norm": 0.53125, "learning_rate": 0.00019987098122266204, "loss": 0.8798, "step": 5230 }, { "contrastive_loss": 4.10400390625, "epoch": 0.6200355660936574, "mse_loss": 0.07589863240718842, "step": 5230 }, { "epoch": 0.6212211025489034, "grad_norm": 0.765625, "learning_rate": 0.00019986887356843438, "loss": 0.8914, "step": 5240 }, { "contrastive_loss": 3.977783203125, "epoch": 0.6212211025489034, "mse_loss": 0.11522074788808823, "step": 5240 }, { "epoch": 0.6224066390041494, "grad_norm": 0.60546875, "learning_rate": 0.00019986674884934767, "loss": 0.8809, "step": 5250 }, { "contrastive_loss": 4.0247802734375, "epoch": 0.6224066390041494, "mse_loss": 0.0939270406961441, "step": 5250 }, { "epoch": 0.6235921754593954, "grad_norm": 0.53125, "learning_rate": 0.00019986460706576496, "loss": 0.8937, "step": 5260 }, { "contrastive_loss": 4.03857421875, "epoch": 0.6235921754593954, "mse_loss": 0.09426240622997284, "step": 5260 }, { "epoch": 0.6247777119146414, "grad_norm": 0.67578125, "learning_rate": 0.00019986244821805217, "loss": 0.8955, "step": 5270 }, { "contrastive_loss": 4.082763671875, "epoch": 0.6247777119146414, "mse_loss": 0.10890883952379227, "step": 5270 }, { "epoch": 0.6259632483698874, "grad_norm": 0.6953125, "learning_rate": 0.00019986027230657825, "loss": 0.9003, "step": 5280 }, { "contrastive_loss": 3.991943359375, "epoch": 0.6259632483698874, "mse_loss": 0.10017138719558716, "step": 5280 }, { "epoch": 0.6271487848251334, "grad_norm": 0.8046875, "learning_rate": 0.00019985807933171494, "loss": 0.8883, "step": 5290 }, { "contrastive_loss": 4.143310546875, "epoch": 0.6271487848251334, "mse_loss": 0.10555099695920944, "step": 5290 }, { "epoch": 0.6283343212803794, "grad_norm": 0.66015625, "learning_rate": 0.00019985586929383703, "loss": 0.8943, "step": 5300 }, { "contrastive_loss": 3.9141845703125, "epoch": 0.6283343212803794, "mse_loss": 0.08333516865968704, "step": 5300 }, { "epoch": 0.6295198577356254, "grad_norm": 0.62109375, "learning_rate": 0.0001998536421933221, "loss": 0.8861, "step": 5310 }, { "contrastive_loss": 4.0806884765625, "epoch": 0.6295198577356254, "mse_loss": 0.11529167741537094, "step": 5310 }, { "epoch": 0.6307053941908713, "grad_norm": 0.4296875, "learning_rate": 0.00019985139803055076, "loss": 0.904, "step": 5320 }, { "contrastive_loss": 4.0225830078125, "epoch": 0.6307053941908713, "mse_loss": 0.08373356610536575, "step": 5320 }, { "epoch": 0.6318909306461173, "grad_norm": 0.5, "learning_rate": 0.0001998491368059064, "loss": 0.8891, "step": 5330 }, { "contrastive_loss": 4.119873046875, "epoch": 0.6318909306461173, "mse_loss": 0.14263859391212463, "step": 5330 }, { "epoch": 0.6330764671013633, "grad_norm": 0.54296875, "learning_rate": 0.00019984685851977548, "loss": 0.9088, "step": 5340 }, { "contrastive_loss": 4.291015625, "epoch": 0.6330764671013633, "mse_loss": 0.09673665463924408, "step": 5340 }, { "epoch": 0.6342620035566093, "grad_norm": 0.6171875, "learning_rate": 0.00019984456317254722, "loss": 0.8951, "step": 5350 }, { "contrastive_loss": 4.101318359375, "epoch": 0.6342620035566093, "mse_loss": 0.07182566076517105, "step": 5350 }, { "epoch": 0.6354475400118553, "grad_norm": 0.51953125, "learning_rate": 0.00019984225076461387, "loss": 0.8887, "step": 5360 }, { "contrastive_loss": 4.1097412109375, "epoch": 0.6354475400118553, "mse_loss": 0.10218970477581024, "step": 5360 }, { "epoch": 0.6366330764671013, "grad_norm": 0.7109375, "learning_rate": 0.00019983992129637054, "loss": 0.8876, "step": 5370 }, { "contrastive_loss": 4.019775390625, "epoch": 0.6366330764671013, "mse_loss": 0.05054580420255661, "step": 5370 }, { "epoch": 0.6378186129223473, "grad_norm": 0.51953125, "learning_rate": 0.00019983757476821535, "loss": 0.8976, "step": 5380 }, { "contrastive_loss": 3.8626708984375, "epoch": 0.6378186129223473, "mse_loss": 0.07208447903394699, "step": 5380 }, { "epoch": 0.6390041493775933, "grad_norm": 0.51171875, "learning_rate": 0.00019983521118054914, "loss": 0.8875, "step": 5390 }, { "contrastive_loss": 4.0478515625, "epoch": 0.6390041493775933, "mse_loss": 0.07745320349931717, "step": 5390 }, { "epoch": 0.6401896858328393, "grad_norm": 0.515625, "learning_rate": 0.00019983283053377586, "loss": 0.8824, "step": 5400 }, { "contrastive_loss": 4.0025634765625, "epoch": 0.6401896858328393, "mse_loss": 0.0860869511961937, "step": 5400 }, { "epoch": 0.6413752222880854, "grad_norm": 0.6796875, "learning_rate": 0.00019983043282830227, "loss": 0.8916, "step": 5410 }, { "contrastive_loss": 4.1014404296875, "epoch": 0.6413752222880854, "mse_loss": 0.09372437745332718, "step": 5410 }, { "epoch": 0.6425607587433314, "grad_norm": 0.56640625, "learning_rate": 0.00019982801806453808, "loss": 0.8857, "step": 5420 }, { "contrastive_loss": 3.8485107421875, "epoch": 0.6425607587433314, "mse_loss": 0.08057431131601334, "step": 5420 }, { "epoch": 0.6437462951985774, "grad_norm": 0.51953125, "learning_rate": 0.00019982558624289588, "loss": 0.8885, "step": 5430 }, { "contrastive_loss": 4.101806640625, "epoch": 0.6437462951985774, "mse_loss": 0.06881527602672577, "step": 5430 }, { "epoch": 0.6449318316538234, "grad_norm": 0.62109375, "learning_rate": 0.00019982313736379128, "loss": 0.8951, "step": 5440 }, { "contrastive_loss": 3.9381103515625, "epoch": 0.6449318316538234, "mse_loss": 0.08089201897382736, "step": 5440 }, { "epoch": 0.6461173681090694, "grad_norm": 0.50390625, "learning_rate": 0.00019982067142764262, "loss": 0.8942, "step": 5450 }, { "contrastive_loss": 3.958984375, "epoch": 0.6461173681090694, "mse_loss": 0.07096078246831894, "step": 5450 }, { "epoch": 0.6473029045643154, "grad_norm": 0.4453125, "learning_rate": 0.00019981818843487137, "loss": 0.8856, "step": 5460 }, { "contrastive_loss": 4.2294921875, "epoch": 0.6473029045643154, "mse_loss": 0.08829251676797867, "step": 5460 }, { "epoch": 0.6484884410195614, "grad_norm": 0.5, "learning_rate": 0.0001998156883859017, "loss": 0.8816, "step": 5470 }, { "contrastive_loss": 4.037109375, "epoch": 0.6484884410195614, "mse_loss": 0.0881347507238388, "step": 5470 }, { "epoch": 0.6496739774748074, "grad_norm": 0.453125, "learning_rate": 0.00019981317128116088, "loss": 0.8764, "step": 5480 }, { "contrastive_loss": 3.9794921875, "epoch": 0.6496739774748074, "mse_loss": 0.08556265383958817, "step": 5480 }, { "epoch": 0.6508595139300534, "grad_norm": 0.48046875, "learning_rate": 0.00019981063712107896, "loss": 0.8907, "step": 5490 }, { "contrastive_loss": 4.0860595703125, "epoch": 0.6508595139300534, "mse_loss": 0.0637243241071701, "step": 5490 }, { "epoch": 0.6520450503852994, "grad_norm": 0.53125, "learning_rate": 0.000199808085906089, "loss": 0.8876, "step": 5500 }, { "contrastive_loss": 3.9796142578125, "epoch": 0.6520450503852994, "mse_loss": 0.06334640830755234, "step": 5500 }, { "epoch": 0.6532305868405454, "grad_norm": 0.56640625, "learning_rate": 0.00019980551763662692, "loss": 0.8812, "step": 5510 }, { "contrastive_loss": 4.1143798828125, "epoch": 0.6532305868405454, "mse_loss": 0.08855058252811432, "step": 5510 }, { "epoch": 0.6544161232957914, "grad_norm": 0.419921875, "learning_rate": 0.00019980293231313154, "loss": 0.8803, "step": 5520 }, { "contrastive_loss": 3.9951171875, "epoch": 0.6544161232957914, "mse_loss": 0.09987704455852509, "step": 5520 }, { "epoch": 0.6556016597510373, "grad_norm": 0.5546875, "learning_rate": 0.00019980032993604466, "loss": 0.8938, "step": 5530 }, { "contrastive_loss": 4.008544921875, "epoch": 0.6556016597510373, "mse_loss": 0.08178029209375381, "step": 5530 }, { "epoch": 0.6567871962062833, "grad_norm": 0.5703125, "learning_rate": 0.00019979771050581096, "loss": 0.8885, "step": 5540 }, { "contrastive_loss": 4.221435546875, "epoch": 0.6567871962062833, "mse_loss": 0.0811576172709465, "step": 5540 }, { "epoch": 0.6579727326615293, "grad_norm": 0.5703125, "learning_rate": 0.00019979507402287795, "loss": 0.8902, "step": 5550 }, { "contrastive_loss": 3.857177734375, "epoch": 0.6579727326615293, "mse_loss": 0.11301545053720474, "step": 5550 }, { "epoch": 0.6591582691167753, "grad_norm": 0.66796875, "learning_rate": 0.00019979242048769624, "loss": 0.8806, "step": 5560 }, { "contrastive_loss": 3.912841796875, "epoch": 0.6591582691167753, "mse_loss": 0.061573777347803116, "step": 5560 }, { "epoch": 0.6603438055720213, "grad_norm": 0.69921875, "learning_rate": 0.00019978974990071918, "loss": 0.8893, "step": 5570 }, { "contrastive_loss": 4.050537109375, "epoch": 0.6603438055720213, "mse_loss": 0.09140723198652267, "step": 5570 }, { "epoch": 0.6615293420272673, "grad_norm": 0.6875, "learning_rate": 0.00019978706226240312, "loss": 0.8853, "step": 5580 }, { "contrastive_loss": 4.0582275390625, "epoch": 0.6615293420272673, "mse_loss": 0.06339161843061447, "step": 5580 }, { "epoch": 0.6627148784825133, "grad_norm": 0.6796875, "learning_rate": 0.00019978435757320731, "loss": 0.889, "step": 5590 }, { "contrastive_loss": 4.22314453125, "epoch": 0.6627148784825133, "mse_loss": 0.08807867765426636, "step": 5590 }, { "epoch": 0.6639004149377593, "grad_norm": 0.578125, "learning_rate": 0.0001997816358335939, "loss": 0.8729, "step": 5600 }, { "contrastive_loss": 3.889404296875, "epoch": 0.6639004149377593, "mse_loss": 0.0909937396645546, "step": 5600 }, { "epoch": 0.6650859513930053, "grad_norm": 0.51171875, "learning_rate": 0.00019977889704402794, "loss": 0.8837, "step": 5610 }, { "contrastive_loss": 3.946044921875, "epoch": 0.6650859513930053, "mse_loss": 0.08057982474565506, "step": 5610 }, { "epoch": 0.6662714878482513, "grad_norm": 0.74609375, "learning_rate": 0.00019977614120497746, "loss": 0.8868, "step": 5620 }, { "contrastive_loss": 4.0244140625, "epoch": 0.6662714878482513, "mse_loss": 0.08236347138881683, "step": 5620 }, { "epoch": 0.6674570243034973, "grad_norm": 0.6328125, "learning_rate": 0.0001997733683169133, "loss": 0.8861, "step": 5630 }, { "contrastive_loss": 3.9810791015625, "epoch": 0.6674570243034973, "mse_loss": 0.11340443044900894, "step": 5630 }, { "epoch": 0.6686425607587433, "grad_norm": 0.53515625, "learning_rate": 0.00019977057838030932, "loss": 0.901, "step": 5640 }, { "contrastive_loss": 4.0631103515625, "epoch": 0.6686425607587433, "mse_loss": 0.0788053423166275, "step": 5640 }, { "epoch": 0.6698280972139893, "grad_norm": 0.52734375, "learning_rate": 0.00019976777139564224, "loss": 0.8835, "step": 5650 }, { "contrastive_loss": 3.9083251953125, "epoch": 0.6698280972139893, "mse_loss": 0.07036475837230682, "step": 5650 }, { "epoch": 0.6710136336692353, "grad_norm": 0.55078125, "learning_rate": 0.00019976494736339165, "loss": 0.8919, "step": 5660 }, { "contrastive_loss": 4.072021484375, "epoch": 0.6710136336692353, "mse_loss": 0.09468164294958115, "step": 5660 }, { "epoch": 0.6721991701244814, "grad_norm": 0.447265625, "learning_rate": 0.00019976210628404014, "loss": 0.8801, "step": 5670 }, { "contrastive_loss": 3.952392578125, "epoch": 0.6721991701244814, "mse_loss": 0.07225848734378815, "step": 5670 }, { "epoch": 0.6733847065797274, "grad_norm": 0.56640625, "learning_rate": 0.00019975924815807317, "loss": 0.8896, "step": 5680 }, { "contrastive_loss": 4.046142578125, "epoch": 0.6733847065797274, "mse_loss": 0.0889502763748169, "step": 5680 }, { "epoch": 0.6745702430349734, "grad_norm": 0.470703125, "learning_rate": 0.00019975637298597914, "loss": 0.8695, "step": 5690 }, { "contrastive_loss": 4.1240234375, "epoch": 0.6745702430349734, "mse_loss": 0.08356472104787827, "step": 5690 }, { "epoch": 0.6757557794902194, "grad_norm": 0.3828125, "learning_rate": 0.0001997534807682493, "loss": 0.8822, "step": 5700 }, { "contrastive_loss": 3.98876953125, "epoch": 0.6757557794902194, "mse_loss": 0.0753662958741188, "step": 5700 }, { "epoch": 0.6769413159454654, "grad_norm": 0.828125, "learning_rate": 0.00019975057150537783, "loss": 0.8987, "step": 5710 }, { "contrastive_loss": 3.9566650390625, "epoch": 0.6769413159454654, "mse_loss": 0.08111635595560074, "step": 5710 }, { "epoch": 0.6781268524007114, "grad_norm": 0.53125, "learning_rate": 0.0001997476451978619, "loss": 0.9043, "step": 5720 }, { "contrastive_loss": 3.962890625, "epoch": 0.6781268524007114, "mse_loss": 0.07490185648202896, "step": 5720 }, { "epoch": 0.6793123888559573, "grad_norm": 0.5546875, "learning_rate": 0.00019974470184620148, "loss": 0.8932, "step": 5730 }, { "contrastive_loss": 4.0213623046875, "epoch": 0.6793123888559573, "mse_loss": 0.0889774039387703, "step": 5730 }, { "epoch": 0.6804979253112033, "grad_norm": 0.57421875, "learning_rate": 0.00019974174145089956, "loss": 0.8912, "step": 5740 }, { "contrastive_loss": 3.982421875, "epoch": 0.6804979253112033, "mse_loss": 0.07558859884738922, "step": 5740 }, { "epoch": 0.6816834617664493, "grad_norm": 0.53515625, "learning_rate": 0.000199738764012462, "loss": 0.8804, "step": 5750 }, { "contrastive_loss": 4.1141357421875, "epoch": 0.6816834617664493, "mse_loss": 0.07872138172388077, "step": 5750 }, { "epoch": 0.6828689982216953, "grad_norm": 0.44921875, "learning_rate": 0.0001997357695313975, "loss": 0.8789, "step": 5760 }, { "contrastive_loss": 4.035888671875, "epoch": 0.6828689982216953, "mse_loss": 0.08431144058704376, "step": 5760 }, { "epoch": 0.6840545346769413, "grad_norm": 0.55859375, "learning_rate": 0.00019973275800821774, "loss": 0.8903, "step": 5770 }, { "contrastive_loss": 3.99853515625, "epoch": 0.6840545346769413, "mse_loss": 0.10123618692159653, "step": 5770 }, { "epoch": 0.6852400711321873, "grad_norm": 0.4921875, "learning_rate": 0.00019972972944343737, "loss": 0.8909, "step": 5780 }, { "contrastive_loss": 4.0831298828125, "epoch": 0.6852400711321873, "mse_loss": 0.07698731124401093, "step": 5780 }, { "epoch": 0.6864256075874333, "grad_norm": 0.546875, "learning_rate": 0.00019972668383757384, "loss": 0.8908, "step": 5790 }, { "contrastive_loss": 3.895263671875, "epoch": 0.6864256075874333, "mse_loss": 0.07198388874530792, "step": 5790 }, { "epoch": 0.6876111440426793, "grad_norm": 0.578125, "learning_rate": 0.00019972362119114755, "loss": 0.8966, "step": 5800 }, { "contrastive_loss": 3.994873046875, "epoch": 0.6876111440426793, "mse_loss": 0.10105441510677338, "step": 5800 }, { "epoch": 0.6887966804979253, "grad_norm": 0.498046875, "learning_rate": 0.00019972054150468188, "loss": 0.8793, "step": 5810 }, { "contrastive_loss": 4.0018310546875, "epoch": 0.6887966804979253, "mse_loss": 0.08420336246490479, "step": 5810 }, { "epoch": 0.6899822169531713, "grad_norm": 0.50390625, "learning_rate": 0.00019971744477870304, "loss": 0.8847, "step": 5820 }, { "contrastive_loss": 3.9434814453125, "epoch": 0.6899822169531713, "mse_loss": 0.0620688833296299, "step": 5820 }, { "epoch": 0.6911677534084173, "grad_norm": 0.482421875, "learning_rate": 0.00019971433101374016, "loss": 0.8867, "step": 5830 }, { "contrastive_loss": 4.179443359375, "epoch": 0.6911677534084173, "mse_loss": 0.0887310653924942, "step": 5830 }, { "epoch": 0.6923532898636633, "grad_norm": 0.65625, "learning_rate": 0.00019971120021032527, "loss": 0.8935, "step": 5840 }, { "contrastive_loss": 3.853759765625, "epoch": 0.6923532898636633, "mse_loss": 0.12120281159877777, "step": 5840 }, { "epoch": 0.6935388263189093, "grad_norm": 0.55859375, "learning_rate": 0.00019970805236899336, "loss": 0.8988, "step": 5850 }, { "contrastive_loss": 4.0472412109375, "epoch": 0.6935388263189093, "mse_loss": 0.10384386032819748, "step": 5850 }, { "epoch": 0.6947243627741553, "grad_norm": 0.439453125, "learning_rate": 0.00019970488749028237, "loss": 0.8875, "step": 5860 }, { "contrastive_loss": 4.02587890625, "epoch": 0.6947243627741553, "mse_loss": 0.0839611366391182, "step": 5860 }, { "epoch": 0.6959098992294013, "grad_norm": 0.5078125, "learning_rate": 0.00019970170557473302, "loss": 0.8787, "step": 5870 }, { "contrastive_loss": 3.9537353515625, "epoch": 0.6959098992294013, "mse_loss": 0.07761891931295395, "step": 5870 }, { "epoch": 0.6970954356846473, "grad_norm": 0.83984375, "learning_rate": 0.00019969850662288904, "loss": 0.9015, "step": 5880 }, { "contrastive_loss": 4.018798828125, "epoch": 0.6970954356846473, "mse_loss": 0.08958861976861954, "step": 5880 }, { "epoch": 0.6982809721398933, "grad_norm": 0.59765625, "learning_rate": 0.00019969529063529703, "loss": 0.8811, "step": 5890 }, { "contrastive_loss": 3.97021484375, "epoch": 0.6982809721398933, "mse_loss": 0.09156129509210587, "step": 5890 }, { "epoch": 0.6994665085951393, "grad_norm": 0.4453125, "learning_rate": 0.00019969205761250652, "loss": 0.8833, "step": 5900 }, { "contrastive_loss": 3.9488525390625, "epoch": 0.6994665085951393, "mse_loss": 0.10839634388685226, "step": 5900 }, { "epoch": 0.7006520450503853, "grad_norm": 0.6953125, "learning_rate": 0.00019968880755507, "loss": 0.8775, "step": 5910 }, { "contrastive_loss": 3.906982421875, "epoch": 0.7006520450503853, "mse_loss": 0.0712883397936821, "step": 5910 }, { "epoch": 0.7018375815056312, "grad_norm": 0.5703125, "learning_rate": 0.0001996855404635427, "loss": 0.8824, "step": 5920 }, { "contrastive_loss": 3.9024658203125, "epoch": 0.7018375815056312, "mse_loss": 0.07802868634462357, "step": 5920 }, { "epoch": 0.7030231179608772, "grad_norm": 0.54296875, "learning_rate": 0.00019968225633848296, "loss": 0.8697, "step": 5930 }, { "contrastive_loss": 3.946044921875, "epoch": 0.7030231179608772, "mse_loss": 0.06795169413089752, "step": 5930 }, { "epoch": 0.7042086544161233, "grad_norm": 0.4296875, "learning_rate": 0.0001996789551804519, "loss": 0.8828, "step": 5940 }, { "contrastive_loss": 4.172607421875, "epoch": 0.7042086544161233, "mse_loss": 0.08697165548801422, "step": 5940 }, { "epoch": 0.7053941908713693, "grad_norm": 0.494140625, "learning_rate": 0.00019967563699001365, "loss": 0.8892, "step": 5950 }, { "contrastive_loss": 3.9833984375, "epoch": 0.7053941908713693, "mse_loss": 0.08351363241672516, "step": 5950 }, { "epoch": 0.7065797273266153, "grad_norm": 0.609375, "learning_rate": 0.0001996723017677352, "loss": 0.8791, "step": 5960 }, { "contrastive_loss": 4.01318359375, "epoch": 0.7065797273266153, "mse_loss": 0.12079516798257828, "step": 5960 }, { "epoch": 0.7077652637818613, "grad_norm": 0.412109375, "learning_rate": 0.0001996689495141864, "loss": 0.8841, "step": 5970 }, { "contrastive_loss": 4.0167236328125, "epoch": 0.7077652637818613, "mse_loss": 0.0725620836019516, "step": 5970 }, { "epoch": 0.7089508002371073, "grad_norm": 0.380859375, "learning_rate": 0.00019966558022994007, "loss": 0.8757, "step": 5980 }, { "contrastive_loss": 3.9044189453125, "epoch": 0.7089508002371073, "mse_loss": 0.09105867147445679, "step": 5980 }, { "epoch": 0.7101363366923533, "grad_norm": 0.63671875, "learning_rate": 0.00019966219391557191, "loss": 0.8712, "step": 5990 }, { "contrastive_loss": 4.1260986328125, "epoch": 0.7101363366923533, "mse_loss": 0.08027661591768265, "step": 5990 }, { "epoch": 0.7113218731475993, "grad_norm": 0.427734375, "learning_rate": 0.00019965879057166064, "loss": 0.8848, "step": 6000 }, { "contrastive_loss": 3.9373779296875, "epoch": 0.7113218731475993, "mse_loss": 0.0864320769906044, "step": 6000 }, { "epoch": 0.7125074096028453, "grad_norm": 0.52734375, "learning_rate": 0.0001996553701987877, "loss": 0.8799, "step": 6010 }, { "contrastive_loss": 3.9481201171875, "epoch": 0.7125074096028453, "mse_loss": 0.11310837417840958, "step": 6010 }, { "epoch": 0.7136929460580913, "grad_norm": 0.5078125, "learning_rate": 0.00019965193279753758, "loss": 0.8715, "step": 6020 }, { "contrastive_loss": 3.93505859375, "epoch": 0.7136929460580913, "mse_loss": 0.07935861498117447, "step": 6020 }, { "epoch": 0.7148784825133373, "grad_norm": 0.494140625, "learning_rate": 0.00019964847836849762, "loss": 0.8784, "step": 6030 }, { "contrastive_loss": 4.0787353515625, "epoch": 0.7148784825133373, "mse_loss": 0.09782583266496658, "step": 6030 }, { "epoch": 0.7160640189685833, "grad_norm": 0.466796875, "learning_rate": 0.00019964500691225815, "loss": 0.8809, "step": 6040 }, { "contrastive_loss": 4.0203857421875, "epoch": 0.7160640189685833, "mse_loss": 0.07246323674917221, "step": 6040 }, { "epoch": 0.7172495554238293, "grad_norm": 0.57421875, "learning_rate": 0.00019964151842941221, "loss": 0.8725, "step": 6050 }, { "contrastive_loss": 3.9407958984375, "epoch": 0.7172495554238293, "mse_loss": 0.0782233327627182, "step": 6050 }, { "epoch": 0.7184350918790753, "grad_norm": 0.640625, "learning_rate": 0.00019963801292055604, "loss": 0.8805, "step": 6060 }, { "contrastive_loss": 4.0316162109375, "epoch": 0.7184350918790753, "mse_loss": 0.08549577742815018, "step": 6060 }, { "epoch": 0.7196206283343213, "grad_norm": 0.4921875, "learning_rate": 0.0001996344903862885, "loss": 0.8833, "step": 6070 }, { "contrastive_loss": 4.091796875, "epoch": 0.7196206283343213, "mse_loss": 0.07454199343919754, "step": 6070 }, { "epoch": 0.7208061647895673, "grad_norm": 0.494140625, "learning_rate": 0.00019963095082721163, "loss": 0.885, "step": 6080 }, { "contrastive_loss": 4.0494384765625, "epoch": 0.7208061647895673, "mse_loss": 0.07284482568502426, "step": 6080 }, { "epoch": 0.7219917012448133, "grad_norm": 0.63671875, "learning_rate": 0.00019962739424393016, "loss": 0.8838, "step": 6090 }, { "contrastive_loss": 4.091552734375, "epoch": 0.7219917012448133, "mse_loss": 0.11091990023851395, "step": 6090 }, { "epoch": 0.7231772377000593, "grad_norm": 0.609375, "learning_rate": 0.00019962382063705184, "loss": 0.8878, "step": 6100 }, { "contrastive_loss": 3.919677734375, "epoch": 0.7231772377000593, "mse_loss": 0.07419133931398392, "step": 6100 }, { "epoch": 0.7243627741553053, "grad_norm": 0.5703125, "learning_rate": 0.00019962023000718725, "loss": 0.8947, "step": 6110 }, { "contrastive_loss": 4.0245361328125, "epoch": 0.7243627741553053, "mse_loss": 0.09717658907175064, "step": 6110 }, { "epoch": 0.7255483106105513, "grad_norm": 0.6171875, "learning_rate": 0.00019961662235495, "loss": 0.8941, "step": 6120 }, { "contrastive_loss": 4.0283203125, "epoch": 0.7255483106105513, "mse_loss": 0.1029597595334053, "step": 6120 }, { "epoch": 0.7267338470657972, "grad_norm": 0.35546875, "learning_rate": 0.0001996129976809565, "loss": 0.8828, "step": 6130 }, { "contrastive_loss": 4.16259765625, "epoch": 0.7267338470657972, "mse_loss": 0.07264114916324615, "step": 6130 }, { "epoch": 0.7279193835210432, "grad_norm": 0.62890625, "learning_rate": 0.00019960935598582614, "loss": 0.8826, "step": 6140 }, { "contrastive_loss": 3.8785400390625, "epoch": 0.7279193835210432, "mse_loss": 0.07976304739713669, "step": 6140 }, { "epoch": 0.7291049199762892, "grad_norm": 0.5, "learning_rate": 0.00019960569727018115, "loss": 0.8644, "step": 6150 }, { "contrastive_loss": 3.9727783203125, "epoch": 0.7291049199762892, "mse_loss": 0.08169496059417725, "step": 6150 }, { "epoch": 0.7302904564315352, "grad_norm": 0.416015625, "learning_rate": 0.00019960202153464668, "loss": 0.8824, "step": 6160 }, { "contrastive_loss": 3.844482421875, "epoch": 0.7302904564315352, "mse_loss": 0.1066582053899765, "step": 6160 }, { "epoch": 0.7314759928867812, "grad_norm": 0.56640625, "learning_rate": 0.0001995983287798509, "loss": 0.8944, "step": 6170 }, { "contrastive_loss": 4.126708984375, "epoch": 0.7314759928867812, "mse_loss": 0.08271251618862152, "step": 6170 }, { "epoch": 0.7326615293420272, "grad_norm": 0.609375, "learning_rate": 0.00019959461900642475, "loss": 0.884, "step": 6180 }, { "contrastive_loss": 3.9122314453125, "epoch": 0.7326615293420272, "mse_loss": 0.07647073268890381, "step": 6180 }, { "epoch": 0.7338470657972732, "grad_norm": 0.5, "learning_rate": 0.00019959089221500208, "loss": 0.8881, "step": 6190 }, { "contrastive_loss": 4.08056640625, "epoch": 0.7338470657972732, "mse_loss": 0.08905960619449615, "step": 6190 }, { "epoch": 0.7350326022525193, "grad_norm": 0.62109375, "learning_rate": 0.0001995871484062198, "loss": 0.887, "step": 6200 }, { "contrastive_loss": 3.8851318359375, "epoch": 0.7350326022525193, "mse_loss": 0.07539854198694229, "step": 6200 }, { "epoch": 0.7362181387077653, "grad_norm": 0.453125, "learning_rate": 0.00019958338758071755, "loss": 0.887, "step": 6210 }, { "contrastive_loss": 3.95849609375, "epoch": 0.7362181387077653, "mse_loss": 0.08888355642557144, "step": 6210 }, { "epoch": 0.7374036751630113, "grad_norm": 0.52734375, "learning_rate": 0.00019957960973913797, "loss": 0.8743, "step": 6220 }, { "contrastive_loss": 4.0618896484375, "epoch": 0.7374036751630113, "mse_loss": 0.09091299027204514, "step": 6220 }, { "epoch": 0.7385892116182573, "grad_norm": 0.404296875, "learning_rate": 0.00019957581488212663, "loss": 0.8761, "step": 6230 }, { "contrastive_loss": 3.9654541015625, "epoch": 0.7385892116182573, "mse_loss": 0.08747311681509018, "step": 6230 }, { "epoch": 0.7397747480735033, "grad_norm": 0.482421875, "learning_rate": 0.00019957200301033189, "loss": 0.8803, "step": 6240 }, { "contrastive_loss": 4.085205078125, "epoch": 0.7397747480735033, "mse_loss": 0.06527847796678543, "step": 6240 }, { "epoch": 0.7409602845287493, "grad_norm": 0.6328125, "learning_rate": 0.00019956817412440517, "loss": 0.8851, "step": 6250 }, { "contrastive_loss": 4.0361328125, "epoch": 0.7409602845287493, "mse_loss": 0.0830717608332634, "step": 6250 }, { "epoch": 0.7421458209839953, "grad_norm": 0.63671875, "learning_rate": 0.00019956432822500065, "loss": 0.8892, "step": 6260 }, { "contrastive_loss": 3.90283203125, "epoch": 0.7421458209839953, "mse_loss": 0.08783972263336182, "step": 6260 }, { "epoch": 0.7433313574392413, "grad_norm": 0.53515625, "learning_rate": 0.00019956046531277555, "loss": 0.8867, "step": 6270 }, { "contrastive_loss": 3.8731689453125, "epoch": 0.7433313574392413, "mse_loss": 0.07834357023239136, "step": 6270 }, { "epoch": 0.7445168938944873, "grad_norm": 0.58984375, "learning_rate": 0.0001995565853883899, "loss": 0.883, "step": 6280 }, { "contrastive_loss": 4.0731201171875, "epoch": 0.7445168938944873, "mse_loss": 0.10195982456207275, "step": 6280 }, { "epoch": 0.7457024303497333, "grad_norm": 0.58203125, "learning_rate": 0.0001995526884525067, "loss": 0.8826, "step": 6290 }, { "contrastive_loss": 4.046142578125, "epoch": 0.7457024303497333, "mse_loss": 0.05674920231103897, "step": 6290 }, { "epoch": 0.7468879668049793, "grad_norm": 0.42578125, "learning_rate": 0.0001995487745057918, "loss": 0.8726, "step": 6300 }, { "contrastive_loss": 3.9603271484375, "epoch": 0.7468879668049793, "mse_loss": 0.06932329386472702, "step": 6300 }, { "epoch": 0.7480735032602253, "grad_norm": 0.486328125, "learning_rate": 0.000199544843548914, "loss": 0.879, "step": 6310 }, { "contrastive_loss": 4.0220947265625, "epoch": 0.7480735032602253, "mse_loss": 0.055201344192028046, "step": 6310 }, { "epoch": 0.7492590397154713, "grad_norm": 0.50390625, "learning_rate": 0.00019954089558254503, "loss": 0.885, "step": 6320 }, { "contrastive_loss": 4.050537109375, "epoch": 0.7492590397154713, "mse_loss": 0.08740226179361343, "step": 6320 }, { "epoch": 0.7504445761707172, "grad_norm": 0.53125, "learning_rate": 0.00019953693060735942, "loss": 0.8781, "step": 6330 }, { "contrastive_loss": 3.958251953125, "epoch": 0.7504445761707172, "mse_loss": 0.1113736629486084, "step": 6330 }, { "epoch": 0.7516301126259632, "grad_norm": 0.52734375, "learning_rate": 0.0001995329486240347, "loss": 0.8901, "step": 6340 }, { "contrastive_loss": 3.9462890625, "epoch": 0.7516301126259632, "mse_loss": 0.08414248377084732, "step": 6340 }, { "epoch": 0.7528156490812092, "grad_norm": 0.546875, "learning_rate": 0.00019952894963325135, "loss": 0.8743, "step": 6350 }, { "contrastive_loss": 3.8148193359375, "epoch": 0.7528156490812092, "mse_loss": 0.057771120220422745, "step": 6350 }, { "epoch": 0.7540011855364552, "grad_norm": 0.50390625, "learning_rate": 0.00019952493363569257, "loss": 0.8743, "step": 6360 }, { "contrastive_loss": 4.038330078125, "epoch": 0.7540011855364552, "mse_loss": 0.09426146000623703, "step": 6360 }, { "epoch": 0.7551867219917012, "grad_norm": 0.51953125, "learning_rate": 0.00019952090063204468, "loss": 0.8786, "step": 6370 }, { "contrastive_loss": 4.0999755859375, "epoch": 0.7551867219917012, "mse_loss": 0.07461632788181305, "step": 6370 }, { "epoch": 0.7563722584469472, "grad_norm": 0.66015625, "learning_rate": 0.00019951685062299674, "loss": 0.8829, "step": 6380 }, { "contrastive_loss": 3.980712890625, "epoch": 0.7563722584469472, "mse_loss": 0.09298665076494217, "step": 6380 }, { "epoch": 0.7575577949021932, "grad_norm": 0.53125, "learning_rate": 0.00019951278360924086, "loss": 0.8782, "step": 6390 }, { "contrastive_loss": 4.0823974609375, "epoch": 0.7575577949021932, "mse_loss": 0.0877332091331482, "step": 6390 }, { "epoch": 0.7587433313574392, "grad_norm": 0.39453125, "learning_rate": 0.00019950869959147193, "loss": 0.8757, "step": 6400 }, { "contrastive_loss": 4.156005859375, "epoch": 0.7587433313574392, "mse_loss": 0.08453533798456192, "step": 6400 }, { "epoch": 0.7599288678126852, "grad_norm": 0.59765625, "learning_rate": 0.0001995045985703878, "loss": 0.884, "step": 6410 }, { "contrastive_loss": 4.01904296875, "epoch": 0.7599288678126852, "mse_loss": 0.09598295390605927, "step": 6410 }, { "epoch": 0.7611144042679312, "grad_norm": 0.5234375, "learning_rate": 0.00019950048054668922, "loss": 0.8834, "step": 6420 }, { "contrastive_loss": 4.0032958984375, "epoch": 0.7611144042679312, "mse_loss": 0.09277383983135223, "step": 6420 }, { "epoch": 0.7622999407231772, "grad_norm": 0.5, "learning_rate": 0.00019949634552107986, "loss": 0.8816, "step": 6430 }, { "contrastive_loss": 3.935302734375, "epoch": 0.7622999407231772, "mse_loss": 0.09140445291996002, "step": 6430 }, { "epoch": 0.7634854771784232, "grad_norm": 0.435546875, "learning_rate": 0.0001994921934942663, "loss": 0.8852, "step": 6440 }, { "contrastive_loss": 3.9306640625, "epoch": 0.7634854771784232, "mse_loss": 0.06811203807592392, "step": 6440 }, { "epoch": 0.7646710136336692, "grad_norm": 0.66015625, "learning_rate": 0.000199488024466958, "loss": 0.8716, "step": 6450 }, { "contrastive_loss": 3.854248046875, "epoch": 0.7646710136336692, "mse_loss": 0.08157406747341156, "step": 6450 }, { "epoch": 0.7658565500889153, "grad_norm": 0.53515625, "learning_rate": 0.0001994838384398673, "loss": 0.8838, "step": 6460 }, { "contrastive_loss": 3.8773193359375, "epoch": 0.7658565500889153, "mse_loss": 0.06990977376699448, "step": 6460 }, { "epoch": 0.7670420865441613, "grad_norm": 0.69921875, "learning_rate": 0.0001994796354137095, "loss": 0.8656, "step": 6470 }, { "contrastive_loss": 3.9521484375, "epoch": 0.7670420865441613, "mse_loss": 0.08867408335208893, "step": 6470 }, { "epoch": 0.7682276229994073, "grad_norm": 0.455078125, "learning_rate": 0.0001994754153892028, "loss": 0.8693, "step": 6480 }, { "contrastive_loss": 3.9439697265625, "epoch": 0.7682276229994073, "mse_loss": 0.07101339846849442, "step": 6480 }, { "epoch": 0.7694131594546533, "grad_norm": 0.609375, "learning_rate": 0.00019947117836706824, "loss": 0.8819, "step": 6490 }, { "contrastive_loss": 3.9288330078125, "epoch": 0.7694131594546533, "mse_loss": 0.07587499171495438, "step": 6490 }, { "epoch": 0.7705986959098993, "grad_norm": 0.5078125, "learning_rate": 0.00019946692434802987, "loss": 0.869, "step": 6500 }, { "contrastive_loss": 3.93310546875, "epoch": 0.7705986959098993, "mse_loss": 0.08535822480916977, "step": 6500 }, { "epoch": 0.7717842323651453, "grad_norm": 0.59375, "learning_rate": 0.00019946265333281452, "loss": 0.8768, "step": 6510 }, { "contrastive_loss": 4.0054931640625, "epoch": 0.7717842323651453, "mse_loss": 0.08132833987474442, "step": 6510 }, { "epoch": 0.7729697688203913, "grad_norm": 0.4140625, "learning_rate": 0.00019945836532215205, "loss": 0.8781, "step": 6520 }, { "contrastive_loss": 4.063720703125, "epoch": 0.7729697688203913, "mse_loss": 0.06349460780620575, "step": 6520 }, { "epoch": 0.7741553052756373, "grad_norm": 0.447265625, "learning_rate": 0.00019945406031677513, "loss": 0.8761, "step": 6530 }, { "contrastive_loss": 4.031005859375, "epoch": 0.7741553052756373, "mse_loss": 0.0843246653676033, "step": 6530 }, { "epoch": 0.7753408417308832, "grad_norm": 0.373046875, "learning_rate": 0.0001994497383174194, "loss": 0.8727, "step": 6540 }, { "contrastive_loss": 4.1265869140625, "epoch": 0.7753408417308832, "mse_loss": 0.0803895965218544, "step": 6540 }, { "epoch": 0.7765263781861292, "grad_norm": 0.54296875, "learning_rate": 0.00019944539932482332, "loss": 0.8881, "step": 6550 }, { "contrastive_loss": 3.94189453125, "epoch": 0.7765263781861292, "mse_loss": 0.06321560591459274, "step": 6550 }, { "epoch": 0.7777119146413752, "grad_norm": 0.46875, "learning_rate": 0.00019944104333972833, "loss": 0.8769, "step": 6560 }, { "contrastive_loss": 3.9149169921875, "epoch": 0.7777119146413752, "mse_loss": 0.08858419954776764, "step": 6560 }, { "epoch": 0.7788974510966212, "grad_norm": 0.54296875, "learning_rate": 0.00019943667036287875, "loss": 0.8715, "step": 6570 }, { "contrastive_loss": 3.95703125, "epoch": 0.7788974510966212, "mse_loss": 0.11789476871490479, "step": 6570 }, { "epoch": 0.7800829875518672, "grad_norm": 0.52734375, "learning_rate": 0.00019943228039502186, "loss": 0.8892, "step": 6580 }, { "contrastive_loss": 4.1185302734375, "epoch": 0.7800829875518672, "mse_loss": 0.08113638311624527, "step": 6580 }, { "epoch": 0.7812685240071132, "grad_norm": 0.58984375, "learning_rate": 0.00019942787343690767, "loss": 0.8766, "step": 6590 }, { "contrastive_loss": 3.90771484375, "epoch": 0.7812685240071132, "mse_loss": 0.0636010393500328, "step": 6590 }, { "epoch": 0.7824540604623592, "grad_norm": 0.50390625, "learning_rate": 0.00019942344948928927, "loss": 0.8749, "step": 6600 }, { "contrastive_loss": 4.04541015625, "epoch": 0.7824540604623592, "mse_loss": 0.07356058806180954, "step": 6600 }, { "epoch": 0.7836395969176052, "grad_norm": 0.482421875, "learning_rate": 0.0001994190085529226, "loss": 0.8713, "step": 6610 }, { "contrastive_loss": 4.0472412109375, "epoch": 0.7836395969176052, "mse_loss": 0.10436280816793442, "step": 6610 }, { "epoch": 0.7848251333728512, "grad_norm": 0.38671875, "learning_rate": 0.00019941455062856648, "loss": 0.8708, "step": 6620 }, { "contrastive_loss": 3.8865966796875, "epoch": 0.7848251333728512, "mse_loss": 0.0768219605088234, "step": 6620 }, { "epoch": 0.7860106698280972, "grad_norm": 0.5546875, "learning_rate": 0.00019941007571698264, "loss": 0.8811, "step": 6630 }, { "contrastive_loss": 3.888671875, "epoch": 0.7860106698280972, "mse_loss": 0.08065687865018845, "step": 6630 }, { "epoch": 0.7871962062833432, "grad_norm": 0.43359375, "learning_rate": 0.00019940558381893576, "loss": 0.8788, "step": 6640 }, { "contrastive_loss": 3.9818115234375, "epoch": 0.7871962062833432, "mse_loss": 0.07989772409200668, "step": 6640 }, { "epoch": 0.7883817427385892, "grad_norm": 0.462890625, "learning_rate": 0.00019940107493519334, "loss": 0.878, "step": 6650 }, { "contrastive_loss": 4.08935546875, "epoch": 0.7883817427385892, "mse_loss": 0.07211867719888687, "step": 6650 }, { "epoch": 0.7895672791938352, "grad_norm": 0.52734375, "learning_rate": 0.00019939654906652585, "loss": 0.8851, "step": 6660 }, { "contrastive_loss": 4.0496826171875, "epoch": 0.7895672791938352, "mse_loss": 0.08928617089986801, "step": 6660 }, { "epoch": 0.7907528156490812, "grad_norm": 0.61328125, "learning_rate": 0.00019939200621370664, "loss": 0.8822, "step": 6670 }, { "contrastive_loss": 4.0528564453125, "epoch": 0.7907528156490812, "mse_loss": 0.07790572196245193, "step": 6670 }, { "epoch": 0.7919383521043272, "grad_norm": 0.5234375, "learning_rate": 0.00019938744637751192, "loss": 0.8836, "step": 6680 }, { "contrastive_loss": 3.9566650390625, "epoch": 0.7919383521043272, "mse_loss": 0.08492223173379898, "step": 6680 }, { "epoch": 0.7931238885595732, "grad_norm": 0.451171875, "learning_rate": 0.00019938286955872086, "loss": 0.8681, "step": 6690 }, { "contrastive_loss": 4.0806884765625, "epoch": 0.7931238885595732, "mse_loss": 0.09193442016839981, "step": 6690 }, { "epoch": 0.7943094250148192, "grad_norm": 0.66796875, "learning_rate": 0.0001993782757581155, "loss": 0.8808, "step": 6700 }, { "contrastive_loss": 3.9833984375, "epoch": 0.7943094250148192, "mse_loss": 0.05181247740983963, "step": 6700 }, { "epoch": 0.7954949614700652, "grad_norm": 0.60546875, "learning_rate": 0.0001993736649764809, "loss": 0.8763, "step": 6710 }, { "contrastive_loss": 4.025634765625, "epoch": 0.7954949614700652, "mse_loss": 0.11340872198343277, "step": 6710 }, { "epoch": 0.7966804979253111, "grad_norm": 0.51953125, "learning_rate": 0.00019936903721460476, "loss": 0.8835, "step": 6720 }, { "contrastive_loss": 3.8984375, "epoch": 0.7966804979253111, "mse_loss": 0.11030034720897675, "step": 6720 }, { "epoch": 0.7978660343805573, "grad_norm": 0.50390625, "learning_rate": 0.00019936439247327791, "loss": 0.8829, "step": 6730 }, { "contrastive_loss": 3.9102783203125, "epoch": 0.7978660343805573, "mse_loss": 0.08126133680343628, "step": 6730 }, { "epoch": 0.7990515708358032, "grad_norm": 0.515625, "learning_rate": 0.00019935973075329403, "loss": 0.8813, "step": 6740 }, { "contrastive_loss": 3.929931640625, "epoch": 0.7990515708358032, "mse_loss": 0.08589009195566177, "step": 6740 }, { "epoch": 0.8002371072910492, "grad_norm": 0.4609375, "learning_rate": 0.00019935505205544965, "loss": 0.865, "step": 6750 }, { "contrastive_loss": 4.199462890625, "epoch": 0.8002371072910492, "mse_loss": 0.06176105514168739, "step": 6750 }, { "epoch": 0.8014226437462952, "grad_norm": 0.431640625, "learning_rate": 0.00019935035638054424, "loss": 0.8719, "step": 6760 }, { "contrastive_loss": 3.9454345703125, "epoch": 0.8014226437462952, "mse_loss": 0.0881158784031868, "step": 6760 }, { "epoch": 0.8026081802015412, "grad_norm": 0.451171875, "learning_rate": 0.00019934564372938018, "loss": 0.857, "step": 6770 }, { "contrastive_loss": 3.958251953125, "epoch": 0.8026081802015412, "mse_loss": 0.07475125789642334, "step": 6770 }, { "epoch": 0.8037937166567872, "grad_norm": 0.60546875, "learning_rate": 0.0001993409141027627, "loss": 0.8807, "step": 6780 }, { "contrastive_loss": 4.0318603515625, "epoch": 0.8037937166567872, "mse_loss": 0.067829430103302, "step": 6780 }, { "epoch": 0.8049792531120332, "grad_norm": 0.447265625, "learning_rate": 0.00019933616750149997, "loss": 0.8719, "step": 6790 }, { "contrastive_loss": 4.0172119140625, "epoch": 0.8049792531120332, "mse_loss": 0.06575574725866318, "step": 6790 }, { "epoch": 0.8061647895672792, "grad_norm": 0.427734375, "learning_rate": 0.0001993314039264031, "loss": 0.8904, "step": 6800 }, { "contrastive_loss": 4.07958984375, "epoch": 0.8061647895672792, "mse_loss": 0.09477537125349045, "step": 6800 }, { "epoch": 0.8073503260225252, "grad_norm": 0.5078125, "learning_rate": 0.00019932662337828597, "loss": 0.8766, "step": 6810 }, { "contrastive_loss": 3.91552734375, "epoch": 0.8073503260225252, "mse_loss": 0.10552208870649338, "step": 6810 }, { "epoch": 0.8085358624777712, "grad_norm": 0.62109375, "learning_rate": 0.00019932182585796554, "loss": 0.8694, "step": 6820 }, { "contrastive_loss": 4.0738525390625, "epoch": 0.8085358624777712, "mse_loss": 0.05551109090447426, "step": 6820 }, { "epoch": 0.8097213989330172, "grad_norm": 0.451171875, "learning_rate": 0.00019931701136626152, "loss": 0.8727, "step": 6830 }, { "contrastive_loss": 3.9193115234375, "epoch": 0.8097213989330172, "mse_loss": 0.07832740247249603, "step": 6830 }, { "epoch": 0.8109069353882632, "grad_norm": 0.546875, "learning_rate": 0.00019931217990399653, "loss": 0.8808, "step": 6840 }, { "contrastive_loss": 4.06494140625, "epoch": 0.8109069353882632, "mse_loss": 0.08040179312229156, "step": 6840 }, { "epoch": 0.8120924718435092, "grad_norm": 0.408203125, "learning_rate": 0.00019930733147199625, "loss": 0.869, "step": 6850 }, { "contrastive_loss": 3.8994140625, "epoch": 0.8120924718435092, "mse_loss": 0.07977216690778732, "step": 6850 }, { "epoch": 0.8132780082987552, "grad_norm": 0.46875, "learning_rate": 0.00019930246607108905, "loss": 0.8809, "step": 6860 }, { "contrastive_loss": 3.9248046875, "epoch": 0.8132780082987552, "mse_loss": 0.08587770909070969, "step": 6860 }, { "epoch": 0.8144635447540012, "grad_norm": 0.55078125, "learning_rate": 0.00019929758370210634, "loss": 0.8936, "step": 6870 }, { "contrastive_loss": 3.92333984375, "epoch": 0.8144635447540012, "mse_loss": 0.07605012506246567, "step": 6870 }, { "epoch": 0.8156490812092472, "grad_norm": 0.51953125, "learning_rate": 0.00019929268436588238, "loss": 0.874, "step": 6880 }, { "contrastive_loss": 4.0074462890625, "epoch": 0.8156490812092472, "mse_loss": 0.10339883714914322, "step": 6880 }, { "epoch": 0.8168346176644932, "grad_norm": 0.515625, "learning_rate": 0.00019928776806325428, "loss": 0.8805, "step": 6890 }, { "contrastive_loss": 4.0435791015625, "epoch": 0.8168346176644932, "mse_loss": 0.05446808785200119, "step": 6890 }, { "epoch": 0.8180201541197392, "grad_norm": 0.408203125, "learning_rate": 0.0001992828347950622, "loss": 0.8626, "step": 6900 }, { "contrastive_loss": 3.9827880859375, "epoch": 0.8180201541197392, "mse_loss": 0.11219538003206253, "step": 6900 }, { "epoch": 0.8192056905749852, "grad_norm": 0.44140625, "learning_rate": 0.00019927788456214902, "loss": 0.8812, "step": 6910 }, { "contrastive_loss": 3.9874267578125, "epoch": 0.8192056905749852, "mse_loss": 0.08201421797275543, "step": 6910 }, { "epoch": 0.8203912270302312, "grad_norm": 0.5390625, "learning_rate": 0.00019927291736536064, "loss": 0.8886, "step": 6920 }, { "contrastive_loss": 3.8812255859375, "epoch": 0.8203912270302312, "mse_loss": 0.07677395641803741, "step": 6920 }, { "epoch": 0.8215767634854771, "grad_norm": 0.392578125, "learning_rate": 0.00019926793320554579, "loss": 0.8666, "step": 6930 }, { "contrastive_loss": 3.939453125, "epoch": 0.8215767634854771, "mse_loss": 0.05839218571782112, "step": 6930 }, { "epoch": 0.8227622999407231, "grad_norm": 0.484375, "learning_rate": 0.00019926293208355613, "loss": 0.8633, "step": 6940 }, { "contrastive_loss": 3.975830078125, "epoch": 0.8227622999407231, "mse_loss": 0.08961587399244308, "step": 6940 }, { "epoch": 0.8239478363959691, "grad_norm": 0.57421875, "learning_rate": 0.00019925791400024622, "loss": 0.8829, "step": 6950 }, { "contrastive_loss": 3.8665771484375, "epoch": 0.8239478363959691, "mse_loss": 0.0766177549958229, "step": 6950 }, { "epoch": 0.8251333728512151, "grad_norm": 0.478515625, "learning_rate": 0.00019925287895647355, "loss": 0.8839, "step": 6960 }, { "contrastive_loss": 3.9122314453125, "epoch": 0.8251333728512151, "mse_loss": 0.07552470266819, "step": 6960 }, { "epoch": 0.8263189093064611, "grad_norm": 0.40625, "learning_rate": 0.00019924782695309842, "loss": 0.8599, "step": 6970 }, { "contrastive_loss": 3.9637451171875, "epoch": 0.8263189093064611, "mse_loss": 0.09375933557748795, "step": 6970 }, { "epoch": 0.8275044457617071, "grad_norm": 0.484375, "learning_rate": 0.00019924275799098408, "loss": 0.8792, "step": 6980 }, { "contrastive_loss": 4.1737060546875, "epoch": 0.8275044457617071, "mse_loss": 0.08042175322771072, "step": 6980 }, { "epoch": 0.8286899822169532, "grad_norm": 1.171875, "learning_rate": 0.0001992376720709967, "loss": 0.8799, "step": 6990 }, { "contrastive_loss": 3.89794921875, "epoch": 0.8286899822169532, "mse_loss": 0.06872071325778961, "step": 6990 }, { "epoch": 0.8298755186721992, "grad_norm": 0.482421875, "learning_rate": 0.00019923256919400533, "loss": 0.8714, "step": 7000 }, { "contrastive_loss": 4.0052490234375, "epoch": 0.8298755186721992, "mse_loss": 0.09404142946004868, "step": 7000 }, { "epoch": 0.8310610551274452, "grad_norm": 0.5390625, "learning_rate": 0.0001992274493608819, "loss": 0.8974, "step": 7010 }, { "contrastive_loss": 3.9808349609375, "epoch": 0.8310610551274452, "mse_loss": 0.07421066612005234, "step": 7010 }, { "epoch": 0.8322465915826912, "grad_norm": 0.458984375, "learning_rate": 0.00019922231257250123, "loss": 0.8714, "step": 7020 }, { "contrastive_loss": 4.057861328125, "epoch": 0.8322465915826912, "mse_loss": 0.06741409003734589, "step": 7020 }, { "epoch": 0.8334321280379372, "grad_norm": 0.53125, "learning_rate": 0.00019921715882974112, "loss": 0.873, "step": 7030 }, { "contrastive_loss": 3.949462890625, "epoch": 0.8334321280379372, "mse_loss": 0.1255863904953003, "step": 7030 }, { "epoch": 0.8346176644931832, "grad_norm": 0.439453125, "learning_rate": 0.00019921198813348213, "loss": 0.8892, "step": 7040 }, { "contrastive_loss": 3.9429931640625, "epoch": 0.8346176644931832, "mse_loss": 0.06009306758642197, "step": 7040 }, { "epoch": 0.8358032009484292, "grad_norm": 0.546875, "learning_rate": 0.00019920680048460786, "loss": 0.8838, "step": 7050 }, { "contrastive_loss": 4.0718994140625, "epoch": 0.8358032009484292, "mse_loss": 0.06266400218009949, "step": 7050 }, { "epoch": 0.8369887374036752, "grad_norm": 0.482421875, "learning_rate": 0.00019920159588400463, "loss": 0.8753, "step": 7060 }, { "contrastive_loss": 4.0604248046875, "epoch": 0.8369887374036752, "mse_loss": 0.06994061172008514, "step": 7060 }, { "epoch": 0.8381742738589212, "grad_norm": 0.4375, "learning_rate": 0.00019919637433256192, "loss": 0.8788, "step": 7070 }, { "contrastive_loss": 3.899169921875, "epoch": 0.8381742738589212, "mse_loss": 0.07394979894161224, "step": 7070 }, { "epoch": 0.8393598103141672, "grad_norm": 0.458984375, "learning_rate": 0.0001991911358311718, "loss": 0.868, "step": 7080 }, { "contrastive_loss": 4.0892333984375, "epoch": 0.8393598103141672, "mse_loss": 0.06949629634618759, "step": 7080 }, { "epoch": 0.8405453467694132, "grad_norm": 0.5078125, "learning_rate": 0.00019918588038072944, "loss": 0.8852, "step": 7090 }, { "contrastive_loss": 4.0762939453125, "epoch": 0.8405453467694132, "mse_loss": 0.09896961599588394, "step": 7090 }, { "epoch": 0.8417308832246592, "grad_norm": 0.49609375, "learning_rate": 0.00019918060798213293, "loss": 0.8798, "step": 7100 }, { "contrastive_loss": 3.8751220703125, "epoch": 0.8417308832246592, "mse_loss": 0.09112872928380966, "step": 7100 }, { "epoch": 0.8429164196799052, "grad_norm": 0.482421875, "learning_rate": 0.00019917531863628305, "loss": 0.8927, "step": 7110 }, { "contrastive_loss": 3.986328125, "epoch": 0.8429164196799052, "mse_loss": 0.08654900640249252, "step": 7110 }, { "epoch": 0.8441019561351512, "grad_norm": 0.5546875, "learning_rate": 0.0001991700123440837, "loss": 0.8746, "step": 7120 }, { "contrastive_loss": 3.9913330078125, "epoch": 0.8441019561351512, "mse_loss": 0.08112975209951401, "step": 7120 }, { "epoch": 0.8452874925903971, "grad_norm": 0.5546875, "learning_rate": 0.0001991646891064415, "loss": 0.8754, "step": 7130 }, { "contrastive_loss": 4.139404296875, "epoch": 0.8452874925903971, "mse_loss": 0.07696057111024857, "step": 7130 }, { "epoch": 0.8464730290456431, "grad_norm": 0.55078125, "learning_rate": 0.00019915934892426616, "loss": 0.885, "step": 7140 }, { "contrastive_loss": 3.9735107421875, "epoch": 0.8464730290456431, "mse_loss": 0.1014106273651123, "step": 7140 }, { "epoch": 0.8476585655008891, "grad_norm": 0.49609375, "learning_rate": 0.00019915399179847002, "loss": 0.8693, "step": 7150 }, { "contrastive_loss": 3.8768310546875, "epoch": 0.8476585655008891, "mse_loss": 0.08862661570310593, "step": 7150 }, { "epoch": 0.8488441019561351, "grad_norm": 0.5546875, "learning_rate": 0.00019914861772996862, "loss": 0.8661, "step": 7160 }, { "contrastive_loss": 3.95068359375, "epoch": 0.8488441019561351, "mse_loss": 0.07622572034597397, "step": 7160 }, { "epoch": 0.8500296384113811, "grad_norm": 0.58984375, "learning_rate": 0.00019914322671968015, "loss": 0.8695, "step": 7170 }, { "contrastive_loss": 3.9306640625, "epoch": 0.8500296384113811, "mse_loss": 0.09148304909467697, "step": 7170 }, { "epoch": 0.8512151748666271, "grad_norm": 0.390625, "learning_rate": 0.00019913781876852583, "loss": 0.8766, "step": 7180 }, { "contrastive_loss": 3.9251708984375, "epoch": 0.8512151748666271, "mse_loss": 0.06774355471134186, "step": 7180 }, { "epoch": 0.8524007113218731, "grad_norm": 0.625, "learning_rate": 0.00019913239387742964, "loss": 0.8827, "step": 7190 }, { "contrastive_loss": 4.023681640625, "epoch": 0.8524007113218731, "mse_loss": 0.07086292654275894, "step": 7190 }, { "epoch": 0.8535862477771191, "grad_norm": 0.48828125, "learning_rate": 0.00019912695204731868, "loss": 0.8854, "step": 7200 }, { "contrastive_loss": 4.0235595703125, "epoch": 0.8535862477771191, "mse_loss": 0.0724741742014885, "step": 7200 }, { "epoch": 0.8547717842323651, "grad_norm": 0.67578125, "learning_rate": 0.0001991214932791227, "loss": 0.8743, "step": 7210 }, { "contrastive_loss": 3.9183349609375, "epoch": 0.8547717842323651, "mse_loss": 0.08133649826049805, "step": 7210 }, { "epoch": 0.8559573206876111, "grad_norm": 0.5234375, "learning_rate": 0.00019911601757377452, "loss": 0.8781, "step": 7220 }, { "contrastive_loss": 4.0057373046875, "epoch": 0.8559573206876111, "mse_loss": 0.08267121762037277, "step": 7220 }, { "epoch": 0.8571428571428571, "grad_norm": 0.6328125, "learning_rate": 0.00019911052493220977, "loss": 0.8754, "step": 7230 }, { "contrastive_loss": 3.9173583984375, "epoch": 0.8571428571428571, "mse_loss": 0.07501637935638428, "step": 7230 }, { "epoch": 0.8583283935981031, "grad_norm": 0.484375, "learning_rate": 0.00019910501535536697, "loss": 0.8748, "step": 7240 }, { "contrastive_loss": 4.0322265625, "epoch": 0.8583283935981031, "mse_loss": 0.08525625616312027, "step": 7240 }, { "epoch": 0.8595139300533492, "grad_norm": 0.46484375, "learning_rate": 0.0001990994888441876, "loss": 0.8627, "step": 7250 }, { "contrastive_loss": 3.9691162109375, "epoch": 0.8595139300533492, "mse_loss": 0.1059809997677803, "step": 7250 }, { "epoch": 0.8606994665085952, "grad_norm": 0.46484375, "learning_rate": 0.00019909394539961595, "loss": 0.8768, "step": 7260 }, { "contrastive_loss": 3.947265625, "epoch": 0.8606994665085952, "mse_loss": 0.08521658927202225, "step": 7260 }, { "epoch": 0.8618850029638412, "grad_norm": 0.48828125, "learning_rate": 0.00019908838502259924, "loss": 0.8716, "step": 7270 }, { "contrastive_loss": 4.0823974609375, "epoch": 0.8618850029638412, "mse_loss": 0.07908736169338226, "step": 7270 }, { "epoch": 0.8630705394190872, "grad_norm": 0.59765625, "learning_rate": 0.0001990828077140876, "loss": 0.8716, "step": 7280 }, { "contrastive_loss": 3.9091796875, "epoch": 0.8630705394190872, "mse_loss": 0.0717579573392868, "step": 7280 }, { "epoch": 0.8642560758743332, "grad_norm": 0.5390625, "learning_rate": 0.00019907721347503407, "loss": 0.8706, "step": 7290 }, { "contrastive_loss": 3.9755859375, "epoch": 0.8642560758743332, "mse_loss": 0.08684612065553665, "step": 7290 }, { "epoch": 0.8654416123295792, "grad_norm": 0.53515625, "learning_rate": 0.0001990716023063945, "loss": 0.8779, "step": 7300 }, { "contrastive_loss": 3.8814697265625, "epoch": 0.8654416123295792, "mse_loss": 0.07823912799358368, "step": 7300 }, { "epoch": 0.8666271487848252, "grad_norm": 0.5625, "learning_rate": 0.00019906597420912774, "loss": 0.8679, "step": 7310 }, { "contrastive_loss": 3.9383544921875, "epoch": 0.8666271487848252, "mse_loss": 0.07723821699619293, "step": 7310 }, { "epoch": 0.8678126852400712, "grad_norm": 0.53515625, "learning_rate": 0.00019906032918419543, "loss": 0.8785, "step": 7320 }, { "contrastive_loss": 3.84716796875, "epoch": 0.8678126852400712, "mse_loss": 0.08632920682430267, "step": 7320 }, { "epoch": 0.8689982216953172, "grad_norm": 0.56640625, "learning_rate": 0.00019905466723256217, "loss": 0.8762, "step": 7330 }, { "contrastive_loss": 3.9537353515625, "epoch": 0.8689982216953172, "mse_loss": 0.07204283773899078, "step": 7330 }, { "epoch": 0.8701837581505631, "grad_norm": 0.458984375, "learning_rate": 0.00019904898835519544, "loss": 0.8651, "step": 7340 }, { "contrastive_loss": 4.0133056640625, "epoch": 0.8701837581505631, "mse_loss": 0.09295908361673355, "step": 7340 }, { "epoch": 0.8713692946058091, "grad_norm": 0.48828125, "learning_rate": 0.00019904329255306558, "loss": 0.8746, "step": 7350 }, { "contrastive_loss": 3.9068603515625, "epoch": 0.8713692946058091, "mse_loss": 0.07248224318027496, "step": 7350 }, { "epoch": 0.8725548310610551, "grad_norm": 0.42578125, "learning_rate": 0.00019903757982714585, "loss": 0.8701, "step": 7360 }, { "contrastive_loss": 3.96875, "epoch": 0.8725548310610551, "mse_loss": 0.11771351844072342, "step": 7360 }, { "epoch": 0.8737403675163011, "grad_norm": 0.439453125, "learning_rate": 0.00019903185017841244, "loss": 0.8818, "step": 7370 }, { "contrastive_loss": 3.8651123046875, "epoch": 0.8737403675163011, "mse_loss": 0.0963180884718895, "step": 7370 }, { "epoch": 0.8749259039715471, "grad_norm": 0.392578125, "learning_rate": 0.00019902610360784438, "loss": 0.8723, "step": 7380 }, { "contrastive_loss": 3.8702392578125, "epoch": 0.8749259039715471, "mse_loss": 0.08259040862321854, "step": 7380 }, { "epoch": 0.8761114404267931, "grad_norm": 0.4609375, "learning_rate": 0.00019902034011642355, "loss": 0.8757, "step": 7390 }, { "contrastive_loss": 3.9901123046875, "epoch": 0.8761114404267931, "mse_loss": 0.07634011656045914, "step": 7390 }, { "epoch": 0.8772969768820391, "grad_norm": 0.5234375, "learning_rate": 0.0001990145597051348, "loss": 0.8762, "step": 7400 }, { "contrastive_loss": 3.9609375, "epoch": 0.8772969768820391, "mse_loss": 0.0662570372223854, "step": 7400 }, { "epoch": 0.8784825133372851, "grad_norm": 0.51171875, "learning_rate": 0.00019900876237496587, "loss": 0.8612, "step": 7410 }, { "contrastive_loss": 3.940673828125, "epoch": 0.8784825133372851, "mse_loss": 0.09315948188304901, "step": 7410 }, { "epoch": 0.8796680497925311, "grad_norm": 0.4921875, "learning_rate": 0.00019900294812690732, "loss": 0.8698, "step": 7420 }, { "contrastive_loss": 4.0216064453125, "epoch": 0.8796680497925311, "mse_loss": 0.07822944223880768, "step": 7420 }, { "epoch": 0.8808535862477771, "grad_norm": 0.443359375, "learning_rate": 0.0001989971169619527, "loss": 0.8717, "step": 7430 }, { "contrastive_loss": 3.9720458984375, "epoch": 0.8808535862477771, "mse_loss": 0.08388954401016235, "step": 7430 }, { "epoch": 0.8820391227030231, "grad_norm": 0.7109375, "learning_rate": 0.00019899126888109833, "loss": 0.8704, "step": 7440 }, { "contrastive_loss": 3.917236328125, "epoch": 0.8820391227030231, "mse_loss": 0.08443251997232437, "step": 7440 }, { "epoch": 0.8832246591582691, "grad_norm": 0.6328125, "learning_rate": 0.00019898540388534357, "loss": 0.8611, "step": 7450 }, { "contrastive_loss": 4.12255859375, "epoch": 0.8832246591582691, "mse_loss": 0.04405950382351875, "step": 7450 }, { "epoch": 0.8844101956135151, "grad_norm": 0.5390625, "learning_rate": 0.00019897952197569052, "loss": 0.8601, "step": 7460 }, { "contrastive_loss": 4.00927734375, "epoch": 0.8844101956135151, "mse_loss": 0.1427246630191803, "step": 7460 }, { "epoch": 0.8855957320687611, "grad_norm": 0.5703125, "learning_rate": 0.00019897362315314426, "loss": 0.8899, "step": 7470 }, { "contrastive_loss": 3.9700927734375, "epoch": 0.8855957320687611, "mse_loss": 0.07597699016332626, "step": 7470 }, { "epoch": 0.8867812685240071, "grad_norm": 0.458984375, "learning_rate": 0.00019896770741871275, "loss": 0.8711, "step": 7480 }, { "contrastive_loss": 4.0257568359375, "epoch": 0.8867812685240071, "mse_loss": 0.06806308776140213, "step": 7480 }, { "epoch": 0.8879668049792531, "grad_norm": 0.46875, "learning_rate": 0.0001989617747734068, "loss": 0.8799, "step": 7490 }, { "contrastive_loss": 3.94970703125, "epoch": 0.8879668049792531, "mse_loss": 0.08193813264369965, "step": 7490 }, { "epoch": 0.8891523414344991, "grad_norm": 0.578125, "learning_rate": 0.00019895582521824019, "loss": 0.8853, "step": 7500 }, { "contrastive_loss": 3.869873046875, "epoch": 0.8891523414344991, "mse_loss": 0.07987262308597565, "step": 7500 }, { "epoch": 0.890337877889745, "grad_norm": 0.53125, "learning_rate": 0.00019894985875422948, "loss": 0.8631, "step": 7510 }, { "contrastive_loss": 3.85400390625, "epoch": 0.890337877889745, "mse_loss": 0.08846213668584824, "step": 7510 }, { "epoch": 0.8915234143449912, "grad_norm": 0.419921875, "learning_rate": 0.00019894387538239413, "loss": 0.8716, "step": 7520 }, { "contrastive_loss": 3.961181640625, "epoch": 0.8915234143449912, "mse_loss": 0.052546076476573944, "step": 7520 }, { "epoch": 0.8927089508002372, "grad_norm": 0.515625, "learning_rate": 0.00019893787510375668, "loss": 0.8675, "step": 7530 }, { "contrastive_loss": 4.050537109375, "epoch": 0.8927089508002372, "mse_loss": 0.08889379352331161, "step": 7530 }, { "epoch": 0.8938944872554832, "grad_norm": 0.36328125, "learning_rate": 0.0001989318579193423, "loss": 0.8786, "step": 7540 }, { "contrastive_loss": 3.9508056640625, "epoch": 0.8938944872554832, "mse_loss": 0.0710422694683075, "step": 7540 }, { "epoch": 0.8950800237107291, "grad_norm": 0.482421875, "learning_rate": 0.0001989258238301792, "loss": 0.8688, "step": 7550 }, { "contrastive_loss": 3.99658203125, "epoch": 0.8950800237107291, "mse_loss": 0.0828033834695816, "step": 7550 }, { "epoch": 0.8962655601659751, "grad_norm": 0.453125, "learning_rate": 0.0001989197728372984, "loss": 0.8717, "step": 7560 }, { "contrastive_loss": 3.793701171875, "epoch": 0.8962655601659751, "mse_loss": 0.07616538554430008, "step": 7560 }, { "epoch": 0.8974510966212211, "grad_norm": 0.5, "learning_rate": 0.00019891370494173392, "loss": 0.8573, "step": 7570 }, { "contrastive_loss": 3.98681640625, "epoch": 0.8974510966212211, "mse_loss": 0.07646708190441132, "step": 7570 }, { "epoch": 0.8986366330764671, "grad_norm": 0.54296875, "learning_rate": 0.00019890762014452258, "loss": 0.8893, "step": 7580 }, { "contrastive_loss": 4.02587890625, "epoch": 0.8986366330764671, "mse_loss": 0.04784423112869263, "step": 7580 }, { "epoch": 0.8998221695317131, "grad_norm": 0.451171875, "learning_rate": 0.00019890151844670405, "loss": 0.8689, "step": 7590 }, { "contrastive_loss": 4.0281982421875, "epoch": 0.8998221695317131, "mse_loss": 0.06719255447387695, "step": 7590 }, { "epoch": 0.9010077059869591, "grad_norm": 0.59375, "learning_rate": 0.00019889539984932098, "loss": 0.8806, "step": 7600 }, { "contrastive_loss": 3.9395751953125, "epoch": 0.9010077059869591, "mse_loss": 0.04324718937277794, "step": 7600 }, { "epoch": 0.9021932424422051, "grad_norm": 0.396484375, "learning_rate": 0.0001988892643534189, "loss": 0.866, "step": 7610 }, { "contrastive_loss": 3.959716796875, "epoch": 0.9021932424422051, "mse_loss": 0.09168402850627899, "step": 7610 }, { "epoch": 0.9033787788974511, "grad_norm": 0.609375, "learning_rate": 0.00019888311196004615, "loss": 0.8755, "step": 7620 }, { "contrastive_loss": 4.0341796875, "epoch": 0.9033787788974511, "mse_loss": 0.06550446897745132, "step": 7620 }, { "epoch": 0.9045643153526971, "grad_norm": 0.427734375, "learning_rate": 0.00019887694267025401, "loss": 0.8823, "step": 7630 }, { "contrastive_loss": 3.9371337890625, "epoch": 0.9045643153526971, "mse_loss": 0.08568640798330307, "step": 7630 }, { "epoch": 0.9057498518079431, "grad_norm": 0.390625, "learning_rate": 0.00019887075648509668, "loss": 0.8824, "step": 7640 }, { "contrastive_loss": 4.06396484375, "epoch": 0.9057498518079431, "mse_loss": 0.09704472124576569, "step": 7640 }, { "epoch": 0.9069353882631891, "grad_norm": 0.5078125, "learning_rate": 0.00019886455340563117, "loss": 0.8874, "step": 7650 }, { "contrastive_loss": 3.9991455078125, "epoch": 0.9069353882631891, "mse_loss": 0.08281542360782623, "step": 7650 }, { "epoch": 0.9081209247184351, "grad_norm": 0.494140625, "learning_rate": 0.00019885833343291745, "loss": 0.8699, "step": 7660 }, { "contrastive_loss": 3.88720703125, "epoch": 0.9081209247184351, "mse_loss": 0.08323652297258377, "step": 7660 }, { "epoch": 0.9093064611736811, "grad_norm": 0.46484375, "learning_rate": 0.00019885209656801832, "loss": 0.8654, "step": 7670 }, { "contrastive_loss": 4.0469970703125, "epoch": 0.9093064611736811, "mse_loss": 0.06904835999011993, "step": 7670 }, { "epoch": 0.9104919976289271, "grad_norm": 0.5078125, "learning_rate": 0.0001988458428119995, "loss": 0.8678, "step": 7680 }, { "contrastive_loss": 3.902099609375, "epoch": 0.9104919976289271, "mse_loss": 0.0816688984632492, "step": 7680 }, { "epoch": 0.9116775340841731, "grad_norm": 0.5078125, "learning_rate": 0.0001988395721659296, "loss": 0.8606, "step": 7690 }, { "contrastive_loss": 4.031982421875, "epoch": 0.9116775340841731, "mse_loss": 0.07651132345199585, "step": 7690 }, { "epoch": 0.9128630705394191, "grad_norm": 0.49609375, "learning_rate": 0.00019883328463088008, "loss": 0.8807, "step": 7700 }, { "contrastive_loss": 3.9453125, "epoch": 0.9128630705394191, "mse_loss": 0.0660691186785698, "step": 7700 }, { "epoch": 0.9140486069946651, "grad_norm": 0.48828125, "learning_rate": 0.00019882698020792528, "loss": 0.8726, "step": 7710 }, { "contrastive_loss": 3.9842529296875, "epoch": 0.9140486069946651, "mse_loss": 0.0789315477013588, "step": 7710 }, { "epoch": 0.915234143449911, "grad_norm": 0.435546875, "learning_rate": 0.0001988206588981425, "loss": 0.8782, "step": 7720 }, { "contrastive_loss": 3.8587646484375, "epoch": 0.915234143449911, "mse_loss": 0.07360893487930298, "step": 7720 }, { "epoch": 0.916419679905157, "grad_norm": 0.5078125, "learning_rate": 0.0001988143207026119, "loss": 0.8676, "step": 7730 }, { "contrastive_loss": 3.902099609375, "epoch": 0.916419679905157, "mse_loss": 0.07998853176832199, "step": 7730 }, { "epoch": 0.917605216360403, "grad_norm": 0.412109375, "learning_rate": 0.00019880796562241643, "loss": 0.8732, "step": 7740 }, { "contrastive_loss": 3.8587646484375, "epoch": 0.917605216360403, "mse_loss": 0.06707847118377686, "step": 7740 }, { "epoch": 0.918790752815649, "grad_norm": 0.48046875, "learning_rate": 0.00019880159365864204, "loss": 0.8803, "step": 7750 }, { "contrastive_loss": 3.892333984375, "epoch": 0.918790752815649, "mse_loss": 0.08801264315843582, "step": 7750 }, { "epoch": 0.919976289270895, "grad_norm": 0.5546875, "learning_rate": 0.00019879520481237754, "loss": 0.8695, "step": 7760 }, { "contrastive_loss": 3.9993896484375, "epoch": 0.919976289270895, "mse_loss": 0.07136140018701553, "step": 7760 }, { "epoch": 0.921161825726141, "grad_norm": 0.41796875, "learning_rate": 0.00019878879908471458, "loss": 0.8625, "step": 7770 }, { "contrastive_loss": 3.9364013671875, "epoch": 0.921161825726141, "mse_loss": 0.11461619287729263, "step": 7770 }, { "epoch": 0.9223473621813871, "grad_norm": 0.44140625, "learning_rate": 0.00019878237647674775, "loss": 0.8706, "step": 7780 }, { "contrastive_loss": 3.9237060546875, "epoch": 0.9223473621813871, "mse_loss": 0.09091413766145706, "step": 7780 }, { "epoch": 0.9235328986366331, "grad_norm": 0.458984375, "learning_rate": 0.0001987759369895745, "loss": 0.8698, "step": 7790 }, { "contrastive_loss": 3.9736328125, "epoch": 0.9235328986366331, "mse_loss": 0.052919983863830566, "step": 7790 }, { "epoch": 0.9247184350918791, "grad_norm": 0.349609375, "learning_rate": 0.0001987694806242951, "loss": 0.8631, "step": 7800 }, { "contrastive_loss": 3.904296875, "epoch": 0.9247184350918791, "mse_loss": 0.06738094985485077, "step": 7800 }, { "epoch": 0.9259039715471251, "grad_norm": 0.435546875, "learning_rate": 0.00019876300738201286, "loss": 0.8666, "step": 7810 }, { "contrastive_loss": 3.932861328125, "epoch": 0.9259039715471251, "mse_loss": 0.06182248145341873, "step": 7810 }, { "epoch": 0.9270895080023711, "grad_norm": 0.47265625, "learning_rate": 0.0001987565172638338, "loss": 0.8755, "step": 7820 }, { "contrastive_loss": 3.998046875, "epoch": 0.9270895080023711, "mse_loss": 0.07264489680528641, "step": 7820 }, { "epoch": 0.9282750444576171, "grad_norm": 0.546875, "learning_rate": 0.00019875001027086695, "loss": 0.889, "step": 7830 }, { "contrastive_loss": 3.9605712890625, "epoch": 0.9282750444576171, "mse_loss": 0.056242313235998154, "step": 7830 }, { "epoch": 0.9294605809128631, "grad_norm": 0.52734375, "learning_rate": 0.00019874348640422414, "loss": 0.8665, "step": 7840 }, { "contrastive_loss": 4.072265625, "epoch": 0.9294605809128631, "mse_loss": 0.06292258203029633, "step": 7840 }, { "epoch": 0.9306461173681091, "grad_norm": 0.50390625, "learning_rate": 0.00019873694566502017, "loss": 0.8739, "step": 7850 }, { "contrastive_loss": 4.0494384765625, "epoch": 0.9306461173681091, "mse_loss": 0.09246693551540375, "step": 7850 }, { "epoch": 0.9318316538233551, "grad_norm": 0.64453125, "learning_rate": 0.00019873038805437264, "loss": 0.8692, "step": 7860 }, { "contrastive_loss": 3.9698486328125, "epoch": 0.9318316538233551, "mse_loss": 0.12287264317274094, "step": 7860 }, { "epoch": 0.9330171902786011, "grad_norm": 0.443359375, "learning_rate": 0.00019872381357340205, "loss": 0.8698, "step": 7870 }, { "contrastive_loss": 3.959716796875, "epoch": 0.9330171902786011, "mse_loss": 0.0760856494307518, "step": 7870 }, { "epoch": 0.9342027267338471, "grad_norm": 0.58203125, "learning_rate": 0.00019871722222323187, "loss": 0.8614, "step": 7880 }, { "contrastive_loss": 3.969482421875, "epoch": 0.9342027267338471, "mse_loss": 0.09494196623563766, "step": 7880 }, { "epoch": 0.9353882631890931, "grad_norm": 0.423828125, "learning_rate": 0.00019871061400498832, "loss": 0.8766, "step": 7890 }, { "contrastive_loss": 4.14208984375, "epoch": 0.9353882631890931, "mse_loss": 0.09949304163455963, "step": 7890 }, { "epoch": 0.9365737996443391, "grad_norm": 0.4609375, "learning_rate": 0.00019870398891980057, "loss": 0.8692, "step": 7900 }, { "contrastive_loss": 3.9344482421875, "epoch": 0.9365737996443391, "mse_loss": 0.06149638071656227, "step": 7900 }, { "epoch": 0.9377593360995851, "grad_norm": 0.421875, "learning_rate": 0.00019869734696880065, "loss": 0.8841, "step": 7910 }, { "contrastive_loss": 3.904052734375, "epoch": 0.9377593360995851, "mse_loss": 0.0889023169875145, "step": 7910 }, { "epoch": 0.9389448725548311, "grad_norm": 0.671875, "learning_rate": 0.00019869068815312352, "loss": 0.8787, "step": 7920 }, { "contrastive_loss": 3.8848876953125, "epoch": 0.9389448725548311, "mse_loss": 0.07460921257734299, "step": 7920 }, { "epoch": 0.940130409010077, "grad_norm": 0.62109375, "learning_rate": 0.000198684012473907, "loss": 0.863, "step": 7930 }, { "contrastive_loss": 3.9483642578125, "epoch": 0.940130409010077, "mse_loss": 0.09383571147918701, "step": 7930 }, { "epoch": 0.941315945465323, "grad_norm": 0.4609375, "learning_rate": 0.00019867731993229178, "loss": 0.8793, "step": 7940 }, { "contrastive_loss": 4.05078125, "epoch": 0.941315945465323, "mse_loss": 0.1267252117395401, "step": 7940 }, { "epoch": 0.942501481920569, "grad_norm": 0.50390625, "learning_rate": 0.00019867061052942136, "loss": 0.8803, "step": 7950 }, { "contrastive_loss": 3.972412109375, "epoch": 0.942501481920569, "mse_loss": 0.1276707798242569, "step": 7950 }, { "epoch": 0.943687018375815, "grad_norm": 0.470703125, "learning_rate": 0.0001986638842664423, "loss": 0.8808, "step": 7960 }, { "contrastive_loss": 3.99365234375, "epoch": 0.943687018375815, "mse_loss": 0.082585409283638, "step": 7960 }, { "epoch": 0.944872554831061, "grad_norm": 0.51171875, "learning_rate": 0.00019865714114450383, "loss": 0.8776, "step": 7970 }, { "contrastive_loss": 3.941162109375, "epoch": 0.944872554831061, "mse_loss": 0.08361498266458511, "step": 7970 }, { "epoch": 0.946058091286307, "grad_norm": 0.515625, "learning_rate": 0.00019865038116475823, "loss": 0.8836, "step": 7980 }, { "contrastive_loss": 3.9091796875, "epoch": 0.946058091286307, "mse_loss": 0.09571681916713715, "step": 7980 }, { "epoch": 0.947243627741553, "grad_norm": 0.458984375, "learning_rate": 0.00019864360432836063, "loss": 0.8839, "step": 7990 }, { "contrastive_loss": 3.9482421875, "epoch": 0.947243627741553, "mse_loss": 0.09676969051361084, "step": 7990 }, { "epoch": 0.948429164196799, "grad_norm": 0.52734375, "learning_rate": 0.00019863681063646892, "loss": 0.8747, "step": 8000 }, { "contrastive_loss": 4.0699462890625, "epoch": 0.948429164196799, "mse_loss": 0.09440547972917557, "step": 8000 }, { "epoch": 0.949614700652045, "grad_norm": 0.39453125, "learning_rate": 0.000198630000090244, "loss": 0.8679, "step": 8010 }, { "contrastive_loss": 3.86962890625, "epoch": 0.949614700652045, "mse_loss": 0.0640212744474411, "step": 8010 }, { "epoch": 0.950800237107291, "grad_norm": 0.470703125, "learning_rate": 0.00019862317269084962, "loss": 0.8605, "step": 8020 }, { "contrastive_loss": 4.00341796875, "epoch": 0.950800237107291, "mse_loss": 0.1225491389632225, "step": 8020 }, { "epoch": 0.951985773562537, "grad_norm": 0.5546875, "learning_rate": 0.00019861632843945235, "loss": 0.8715, "step": 8030 }, { "contrastive_loss": 3.8504638671875, "epoch": 0.951985773562537, "mse_loss": 0.06600511819124222, "step": 8030 }, { "epoch": 0.9531713100177831, "grad_norm": 0.35546875, "learning_rate": 0.00019860946733722172, "loss": 0.8618, "step": 8040 }, { "contrastive_loss": 3.8358154296875, "epoch": 0.9531713100177831, "mse_loss": 0.08473344892263412, "step": 8040 }, { "epoch": 0.9543568464730291, "grad_norm": 0.453125, "learning_rate": 0.0001986025893853301, "loss": 0.8599, "step": 8050 }, { "contrastive_loss": 3.9114990234375, "epoch": 0.9543568464730291, "mse_loss": 0.06881146878004074, "step": 8050 }, { "epoch": 0.9555423829282751, "grad_norm": 0.490234375, "learning_rate": 0.00019859569458495276, "loss": 0.8638, "step": 8060 }, { "contrastive_loss": 3.9659423828125, "epoch": 0.9555423829282751, "mse_loss": 0.07199494540691376, "step": 8060 }, { "epoch": 0.9567279193835211, "grad_norm": 0.373046875, "learning_rate": 0.00019858878293726778, "loss": 0.8705, "step": 8070 }, { "contrastive_loss": 3.954345703125, "epoch": 0.9567279193835211, "mse_loss": 0.06986123323440552, "step": 8070 }, { "epoch": 0.9579134558387671, "grad_norm": 0.458984375, "learning_rate": 0.0001985818544434562, "loss": 0.8682, "step": 8080 }, { "contrastive_loss": 3.903564453125, "epoch": 0.9579134558387671, "mse_loss": 0.07034090906381607, "step": 8080 }, { "epoch": 0.9590989922940131, "grad_norm": 0.4921875, "learning_rate": 0.00019857490910470195, "loss": 0.8625, "step": 8090 }, { "contrastive_loss": 3.9696044921875, "epoch": 0.9590989922940131, "mse_loss": 0.08119017630815506, "step": 8090 }, { "epoch": 0.9602845287492591, "grad_norm": 0.3984375, "learning_rate": 0.00019856794692219175, "loss": 0.8683, "step": 8100 }, { "contrastive_loss": 3.98681640625, "epoch": 0.9602845287492591, "mse_loss": 0.07148043066263199, "step": 8100 }, { "epoch": 0.9614700652045051, "grad_norm": 0.482421875, "learning_rate": 0.00019856096789711524, "loss": 0.8679, "step": 8110 }, { "contrastive_loss": 3.9595947265625, "epoch": 0.9614700652045051, "mse_loss": 0.08519626408815384, "step": 8110 }, { "epoch": 0.9626556016597511, "grad_norm": 0.49609375, "learning_rate": 0.000198553972030665, "loss": 0.8713, "step": 8120 }, { "contrastive_loss": 3.999267578125, "epoch": 0.9626556016597511, "mse_loss": 0.06773719191551208, "step": 8120 }, { "epoch": 0.963841138114997, "grad_norm": 0.462890625, "learning_rate": 0.00019854695932403638, "loss": 0.8626, "step": 8130 }, { "contrastive_loss": 3.9453125, "epoch": 0.963841138114997, "mse_loss": 0.08847074955701828, "step": 8130 }, { "epoch": 0.965026674570243, "grad_norm": 0.4609375, "learning_rate": 0.00019853992977842766, "loss": 0.8802, "step": 8140 }, { "contrastive_loss": 4.12841796875, "epoch": 0.965026674570243, "mse_loss": 0.08217824995517731, "step": 8140 }, { "epoch": 0.966212211025489, "grad_norm": 0.52734375, "learning_rate": 0.00019853288339504002, "loss": 0.8794, "step": 8150 }, { "contrastive_loss": 3.8697509765625, "epoch": 0.966212211025489, "mse_loss": 0.09609048068523407, "step": 8150 }, { "epoch": 0.967397747480735, "grad_norm": 0.451171875, "learning_rate": 0.0001985258201750775, "loss": 0.8683, "step": 8160 }, { "contrastive_loss": 3.912353515625, "epoch": 0.967397747480735, "mse_loss": 0.08172322809696198, "step": 8160 }, { "epoch": 0.968583283935981, "grad_norm": 0.484375, "learning_rate": 0.000198518740119747, "loss": 0.8708, "step": 8170 }, { "contrastive_loss": 3.7838134765625, "epoch": 0.968583283935981, "mse_loss": 0.08650754392147064, "step": 8170 }, { "epoch": 0.969768820391227, "grad_norm": 0.57421875, "learning_rate": 0.0001985116432302583, "loss": 0.8594, "step": 8180 }, { "contrastive_loss": 3.994873046875, "epoch": 0.969768820391227, "mse_loss": 0.08085180819034576, "step": 8180 }, { "epoch": 0.970954356846473, "grad_norm": 0.5390625, "learning_rate": 0.0001985045295078241, "loss": 0.8773, "step": 8190 }, { "contrastive_loss": 4.0657958984375, "epoch": 0.970954356846473, "mse_loss": 0.08635701984167099, "step": 8190 }, { "epoch": 0.972139893301719, "grad_norm": 0.51171875, "learning_rate": 0.00019849739895365986, "loss": 0.8756, "step": 8200 }, { "contrastive_loss": 3.9144287109375, "epoch": 0.972139893301719, "mse_loss": 0.07517725974321365, "step": 8200 }, { "epoch": 0.973325429756965, "grad_norm": 0.50390625, "learning_rate": 0.00019849025156898407, "loss": 0.8732, "step": 8210 }, { "contrastive_loss": 3.8656005859375, "epoch": 0.973325429756965, "mse_loss": 0.0972118005156517, "step": 8210 }, { "epoch": 0.974510966212211, "grad_norm": 0.765625, "learning_rate": 0.00019848308735501803, "loss": 0.8773, "step": 8220 }, { "contrastive_loss": 3.926025390625, "epoch": 0.974510966212211, "mse_loss": 0.06517840921878815, "step": 8220 }, { "epoch": 0.975696502667457, "grad_norm": 0.439453125, "learning_rate": 0.00019847590631298585, "loss": 0.8748, "step": 8230 }, { "contrastive_loss": 4.01904296875, "epoch": 0.975696502667457, "mse_loss": 0.08118437230587006, "step": 8230 }, { "epoch": 0.976882039122703, "grad_norm": 0.451171875, "learning_rate": 0.0001984687084441146, "loss": 0.8638, "step": 8240 }, { "contrastive_loss": 3.9447021484375, "epoch": 0.976882039122703, "mse_loss": 0.08673649281263351, "step": 8240 }, { "epoch": 0.978067575577949, "grad_norm": 0.3984375, "learning_rate": 0.0001984614937496342, "loss": 0.8672, "step": 8250 }, { "contrastive_loss": 4.02001953125, "epoch": 0.978067575577949, "mse_loss": 0.057576682418584824, "step": 8250 }, { "epoch": 0.979253112033195, "grad_norm": 0.4140625, "learning_rate": 0.00019845426223077746, "loss": 0.8761, "step": 8260 }, { "contrastive_loss": 3.9736328125, "epoch": 0.979253112033195, "mse_loss": 0.07731092721223831, "step": 8260 }, { "epoch": 0.980438648488441, "grad_norm": 0.61328125, "learning_rate": 0.00019844701388878005, "loss": 0.8797, "step": 8270 }, { "contrastive_loss": 3.92626953125, "epoch": 0.980438648488441, "mse_loss": 0.07542704045772552, "step": 8270 }, { "epoch": 0.981624184943687, "grad_norm": 0.48046875, "learning_rate": 0.00019843974872488048, "loss": 0.8718, "step": 8280 }, { "contrastive_loss": 3.983642578125, "epoch": 0.981624184943687, "mse_loss": 0.10767959803342819, "step": 8280 }, { "epoch": 0.982809721398933, "grad_norm": 0.52734375, "learning_rate": 0.00019843246674032015, "loss": 0.8674, "step": 8290 }, { "contrastive_loss": 3.964599609375, "epoch": 0.982809721398933, "mse_loss": 0.051420144736766815, "step": 8290 }, { "epoch": 0.983995257854179, "grad_norm": 0.4375, "learning_rate": 0.00019842516793634345, "loss": 0.8635, "step": 8300 }, { "contrastive_loss": 3.99853515625, "epoch": 0.983995257854179, "mse_loss": 0.06638186424970627, "step": 8300 }, { "epoch": 0.9851807943094251, "grad_norm": 0.56640625, "learning_rate": 0.00019841785231419749, "loss": 0.8698, "step": 8310 }, { "contrastive_loss": 3.839599609375, "epoch": 0.9851807943094251, "mse_loss": 0.05485871806740761, "step": 8310 }, { "epoch": 0.9863663307646711, "grad_norm": 0.369140625, "learning_rate": 0.00019841051987513225, "loss": 0.8675, "step": 8320 }, { "contrastive_loss": 3.9859619140625, "epoch": 0.9863663307646711, "mse_loss": 0.04240485653281212, "step": 8320 }, { "epoch": 0.9875518672199171, "grad_norm": 0.37109375, "learning_rate": 0.00019840317062040072, "loss": 0.8644, "step": 8330 }, { "contrastive_loss": 4.0169677734375, "epoch": 0.9875518672199171, "mse_loss": 0.08211930841207504, "step": 8330 }, { "epoch": 0.988737403675163, "grad_norm": 0.60546875, "learning_rate": 0.00019839580455125865, "loss": 0.8666, "step": 8340 }, { "contrastive_loss": 3.9818115234375, "epoch": 0.988737403675163, "mse_loss": 0.07421641796827316, "step": 8340 }, { "epoch": 0.989922940130409, "grad_norm": 0.474609375, "learning_rate": 0.00019838842166896474, "loss": 0.8742, "step": 8350 }, { "contrastive_loss": 4.0218505859375, "epoch": 0.989922940130409, "mse_loss": 0.059489063918590546, "step": 8350 }, { "epoch": 0.991108476585655, "grad_norm": 0.49609375, "learning_rate": 0.00019838102197478044, "loss": 0.8691, "step": 8360 }, { "contrastive_loss": 3.967529296875, "epoch": 0.991108476585655, "mse_loss": 0.0771031603217125, "step": 8360 }, { "epoch": 0.992294013040901, "grad_norm": 0.5703125, "learning_rate": 0.00019837360546997028, "loss": 0.8646, "step": 8370 }, { "contrastive_loss": 3.82373046875, "epoch": 0.992294013040901, "mse_loss": 0.0629580169916153, "step": 8370 }, { "epoch": 0.993479549496147, "grad_norm": 0.66796875, "learning_rate": 0.00019836617215580145, "loss": 0.8776, "step": 8380 }, { "contrastive_loss": 3.8507080078125, "epoch": 0.993479549496147, "mse_loss": 0.04871120676398277, "step": 8380 }, { "epoch": 0.994665085951393, "grad_norm": 0.435546875, "learning_rate": 0.0001983587220335441, "loss": 0.866, "step": 8390 }, { "contrastive_loss": 3.7833251953125, "epoch": 0.994665085951393, "mse_loss": 0.09239651262760162, "step": 8390 }, { "epoch": 0.995850622406639, "grad_norm": 0.474609375, "learning_rate": 0.00019835125510447128, "loss": 0.8515, "step": 8400 }, { "contrastive_loss": 4.0078125, "epoch": 0.995850622406639, "mse_loss": 0.05646755173802376, "step": 8400 }, { "epoch": 0.997036158861885, "grad_norm": 0.443359375, "learning_rate": 0.00019834377136985888, "loss": 0.871, "step": 8410 }, { "contrastive_loss": 4.0174560546875, "epoch": 0.997036158861885, "mse_loss": 0.07951414585113525, "step": 8410 }, { "epoch": 0.998221695317131, "grad_norm": 0.404296875, "learning_rate": 0.00019833627083098567, "loss": 0.8635, "step": 8420 }, { "contrastive_loss": 4.0281982421875, "epoch": 0.998221695317131, "mse_loss": 0.095278799533844, "step": 8420 }, { "epoch": 0.999407231772377, "grad_norm": 0.61328125, "learning_rate": 0.00019832875348913326, "loss": 0.8633, "step": 8430 }, { "contrastive_loss": 3.9979248046875, "epoch": 0.999407231772377, "mse_loss": 0.07004760205745697, "step": 8430 }, { "epoch": 1.000592768227623, "grad_norm": 0.484375, "learning_rate": 0.00019832121934558616, "loss": 0.8697, "step": 8440 }, { "contrastive_loss": 3.906982421875, "epoch": 1.000592768227623, "mse_loss": 0.08269017189741135, "step": 8440 }, { "epoch": 1.001778304682869, "grad_norm": 0.376953125, "learning_rate": 0.0001983136684016318, "loss": 0.867, "step": 8450 }, { "contrastive_loss": 4.0753173828125, "epoch": 1.001778304682869, "mse_loss": 0.06675488501787186, "step": 8450 }, { "epoch": 1.002963841138115, "grad_norm": 0.50390625, "learning_rate": 0.00019830610065856038, "loss": 0.8592, "step": 8460 }, { "contrastive_loss": 4.0546875, "epoch": 1.002963841138115, "mse_loss": 0.07360005378723145, "step": 8460 }, { "epoch": 1.004149377593361, "grad_norm": 0.466796875, "learning_rate": 0.00019829851611766506, "loss": 0.8597, "step": 8470 }, { "contrastive_loss": 3.9478759765625, "epoch": 1.004149377593361, "mse_loss": 0.05581342428922653, "step": 8470 }, { "epoch": 1.005334914048607, "grad_norm": 0.546875, "learning_rate": 0.00019829091478024176, "loss": 0.8655, "step": 8480 }, { "contrastive_loss": 4.01708984375, "epoch": 1.005334914048607, "mse_loss": 0.0683521032333374, "step": 8480 }, { "epoch": 1.006520450503853, "grad_norm": 0.40625, "learning_rate": 0.0001982832966475894, "loss": 0.8748, "step": 8490 }, { "contrastive_loss": 3.890625, "epoch": 1.006520450503853, "mse_loss": 0.062373239547014236, "step": 8490 }, { "epoch": 1.007705986959099, "grad_norm": 0.498046875, "learning_rate": 0.0001982756617210097, "loss": 0.85, "step": 8500 }, { "contrastive_loss": 4.0091552734375, "epoch": 1.007705986959099, "mse_loss": 0.0871616080403328, "step": 8500 }, { "epoch": 1.008891523414345, "grad_norm": 0.61328125, "learning_rate": 0.00019826801000180728, "loss": 0.868, "step": 8510 }, { "contrastive_loss": 3.9095458984375, "epoch": 1.008891523414345, "mse_loss": 0.10950612276792526, "step": 8510 }, { "epoch": 1.010077059869591, "grad_norm": 0.4765625, "learning_rate": 0.00019826034149128958, "loss": 0.875, "step": 8520 }, { "contrastive_loss": 3.9493408203125, "epoch": 1.010077059869591, "mse_loss": 0.07874538749456406, "step": 8520 }, { "epoch": 1.011262596324837, "grad_norm": 0.5390625, "learning_rate": 0.00019825265619076695, "loss": 0.873, "step": 8530 }, { "contrastive_loss": 3.935546875, "epoch": 1.011262596324837, "mse_loss": 0.06725673377513885, "step": 8530 }, { "epoch": 1.012448132780083, "grad_norm": 0.48046875, "learning_rate": 0.00019824495410155257, "loss": 0.855, "step": 8540 }, { "contrastive_loss": 4.12939453125, "epoch": 1.012448132780083, "mse_loss": 0.08701753616333008, "step": 8540 }, { "epoch": 1.013633669235329, "grad_norm": 0.51953125, "learning_rate": 0.00019823723522496253, "loss": 0.861, "step": 8550 }, { "contrastive_loss": 4.00390625, "epoch": 1.013633669235329, "mse_loss": 0.059956200420856476, "step": 8550 }, { "epoch": 1.014819205690575, "grad_norm": 0.455078125, "learning_rate": 0.0001982294995623158, "loss": 0.8727, "step": 8560 }, { "contrastive_loss": 4.006103515625, "epoch": 1.014819205690575, "mse_loss": 0.07858453691005707, "step": 8560 }, { "epoch": 1.016004742145821, "grad_norm": 0.5, "learning_rate": 0.00019822174711493418, "loss": 0.8666, "step": 8570 }, { "contrastive_loss": 3.8958740234375, "epoch": 1.016004742145821, "mse_loss": 0.0699772983789444, "step": 8570 }, { "epoch": 1.017190278601067, "grad_norm": 0.515625, "learning_rate": 0.00019821397788414235, "loss": 0.8607, "step": 8580 }, { "contrastive_loss": 3.943603515625, "epoch": 1.017190278601067, "mse_loss": 0.08914261311292648, "step": 8580 }, { "epoch": 1.018375815056313, "grad_norm": 0.494140625, "learning_rate": 0.00019820619187126785, "loss": 0.8656, "step": 8590 }, { "contrastive_loss": 4.1441650390625, "epoch": 1.018375815056313, "mse_loss": 0.10151201486587524, "step": 8590 }, { "epoch": 1.019561351511559, "grad_norm": 0.41015625, "learning_rate": 0.00019819838907764113, "loss": 0.8799, "step": 8600 }, { "contrastive_loss": 3.9915771484375, "epoch": 1.019561351511559, "mse_loss": 0.06978797912597656, "step": 8600 }, { "epoch": 1.020746887966805, "grad_norm": 0.5390625, "learning_rate": 0.0001981905695045954, "loss": 0.8657, "step": 8610 }, { "contrastive_loss": 3.917236328125, "epoch": 1.020746887966805, "mse_loss": 0.05693100020289421, "step": 8610 }, { "epoch": 1.021932424422051, "grad_norm": 0.58203125, "learning_rate": 0.00019818273315346693, "loss": 0.8746, "step": 8620 }, { "contrastive_loss": 3.843505859375, "epoch": 1.021932424422051, "mse_loss": 0.06346254050731659, "step": 8620 }, { "epoch": 1.023117960877297, "grad_norm": 0.60546875, "learning_rate": 0.00019817488002559462, "loss": 0.8525, "step": 8630 }, { "contrastive_loss": 4.0167236328125, "epoch": 1.023117960877297, "mse_loss": 0.07413525134325027, "step": 8630 }, { "epoch": 1.024303497332543, "grad_norm": 0.482421875, "learning_rate": 0.0001981670101223204, "loss": 0.8725, "step": 8640 }, { "contrastive_loss": 3.8690185546875, "epoch": 1.024303497332543, "mse_loss": 0.06666528433561325, "step": 8640 }, { "epoch": 1.0254890337877889, "grad_norm": 0.51953125, "learning_rate": 0.000198159123444989, "loss": 0.86, "step": 8650 }, { "contrastive_loss": 3.9876708984375, "epoch": 1.0254890337877889, "mse_loss": 0.05867250636219978, "step": 8650 }, { "epoch": 1.0266745702430349, "grad_norm": 0.5078125, "learning_rate": 0.0001981512199949481, "loss": 0.8653, "step": 8660 }, { "contrastive_loss": 4.1063232421875, "epoch": 1.0266745702430349, "mse_loss": 0.09512174129486084, "step": 8660 }, { "epoch": 1.0278601066982809, "grad_norm": 0.4609375, "learning_rate": 0.00019814329977354815, "loss": 0.8567, "step": 8670 }, { "contrastive_loss": 3.9156494140625, "epoch": 1.0278601066982809, "mse_loss": 0.0715278908610344, "step": 8670 }, { "epoch": 1.0290456431535269, "grad_norm": 0.48046875, "learning_rate": 0.0001981353627821425, "loss": 0.8621, "step": 8680 }, { "contrastive_loss": 3.9451904296875, "epoch": 1.0290456431535269, "mse_loss": 0.06491746008396149, "step": 8680 }, { "epoch": 1.0302311796087729, "grad_norm": 0.57421875, "learning_rate": 0.00019812740902208734, "loss": 0.8695, "step": 8690 }, { "contrastive_loss": 3.901123046875, "epoch": 1.0302311796087729, "mse_loss": 0.060728464275598526, "step": 8690 }, { "epoch": 1.0314167160640189, "grad_norm": 0.5078125, "learning_rate": 0.00019811943849474176, "loss": 0.8635, "step": 8700 }, { "contrastive_loss": 3.9183349609375, "epoch": 1.0314167160640189, "mse_loss": 0.07017166167497635, "step": 8700 }, { "epoch": 1.032602252519265, "grad_norm": 0.53515625, "learning_rate": 0.00019811145120146774, "loss": 0.8669, "step": 8710 }, { "contrastive_loss": 3.9696044921875, "epoch": 1.032602252519265, "mse_loss": 0.0635877326130867, "step": 8710 }, { "epoch": 1.033787788974511, "grad_norm": 0.4375, "learning_rate": 0.00019810344714363002, "loss": 0.8647, "step": 8720 }, { "contrastive_loss": 3.985107421875, "epoch": 1.033787788974511, "mse_loss": 0.07548292726278305, "step": 8720 }, { "epoch": 1.034973325429757, "grad_norm": 0.49609375, "learning_rate": 0.00019809542632259633, "loss": 0.8705, "step": 8730 }, { "contrastive_loss": 3.962646484375, "epoch": 1.034973325429757, "mse_loss": 0.06218055263161659, "step": 8730 }, { "epoch": 1.036158861885003, "grad_norm": 0.466796875, "learning_rate": 0.00019808738873973723, "loss": 0.8611, "step": 8740 }, { "contrastive_loss": 3.7939453125, "epoch": 1.036158861885003, "mse_loss": 0.06368984282016754, "step": 8740 }, { "epoch": 1.037344398340249, "grad_norm": 0.578125, "learning_rate": 0.00019807933439642606, "loss": 0.8652, "step": 8750 }, { "contrastive_loss": 4.0142822265625, "epoch": 1.037344398340249, "mse_loss": 0.06598328799009323, "step": 8750 }, { "epoch": 1.038529934795495, "grad_norm": 0.416015625, "learning_rate": 0.00019807126329403913, "loss": 0.8693, "step": 8760 }, { "contrastive_loss": 3.9949951171875, "epoch": 1.038529934795495, "mse_loss": 0.09755360335111618, "step": 8760 }, { "epoch": 1.039715471250741, "grad_norm": 0.400390625, "learning_rate": 0.00019806317543395556, "loss": 0.85, "step": 8770 }, { "contrastive_loss": 3.9578857421875, "epoch": 1.039715471250741, "mse_loss": 0.07490207254886627, "step": 8770 }, { "epoch": 1.040901007705987, "grad_norm": 0.5390625, "learning_rate": 0.00019805507081755734, "loss": 0.8517, "step": 8780 }, { "contrastive_loss": 3.9232177734375, "epoch": 1.040901007705987, "mse_loss": 0.09288696944713593, "step": 8780 }, { "epoch": 1.042086544161233, "grad_norm": 0.44921875, "learning_rate": 0.00019804694944622933, "loss": 0.8693, "step": 8790 }, { "contrastive_loss": 3.8006591796875, "epoch": 1.042086544161233, "mse_loss": 0.08406596630811691, "step": 8790 }, { "epoch": 1.043272080616479, "grad_norm": 0.478515625, "learning_rate": 0.00019803881132135923, "loss": 0.8639, "step": 8800 }, { "contrastive_loss": 3.92578125, "epoch": 1.043272080616479, "mse_loss": 0.09738080948591232, "step": 8800 }, { "epoch": 1.044457617071725, "grad_norm": 0.5625, "learning_rate": 0.00019803065644433766, "loss": 0.8671, "step": 8810 }, { "contrastive_loss": 3.817138671875, "epoch": 1.044457617071725, "mse_loss": 0.05896385386586189, "step": 8810 }, { "epoch": 1.045643153526971, "grad_norm": 0.6015625, "learning_rate": 0.00019802248481655808, "loss": 0.8627, "step": 8820 }, { "contrastive_loss": 4.0087890625, "epoch": 1.045643153526971, "mse_loss": 0.0712377205491066, "step": 8820 }, { "epoch": 1.046828689982217, "grad_norm": 0.49609375, "learning_rate": 0.0001980142964394167, "loss": 0.8609, "step": 8830 }, { "contrastive_loss": 3.9722900390625, "epoch": 1.046828689982217, "mse_loss": 0.0794239491224289, "step": 8830 }, { "epoch": 1.048014226437463, "grad_norm": 0.455078125, "learning_rate": 0.00019800609131431283, "loss": 0.8623, "step": 8840 }, { "contrastive_loss": 3.8717041015625, "epoch": 1.048014226437463, "mse_loss": 0.0702713131904602, "step": 8840 }, { "epoch": 1.049199762892709, "grad_norm": 0.43359375, "learning_rate": 0.00019799786944264838, "loss": 0.8636, "step": 8850 }, { "contrastive_loss": 3.82861328125, "epoch": 1.049199762892709, "mse_loss": 0.052694499492645264, "step": 8850 }, { "epoch": 1.050385299347955, "grad_norm": 0.494140625, "learning_rate": 0.0001979896308258283, "loss": 0.8666, "step": 8860 }, { "contrastive_loss": 3.97314453125, "epoch": 1.050385299347955, "mse_loss": 0.06748475879430771, "step": 8860 }, { "epoch": 1.051570835803201, "grad_norm": 0.5859375, "learning_rate": 0.00019798137546526032, "loss": 0.8616, "step": 8870 }, { "contrastive_loss": 4.020263671875, "epoch": 1.051570835803201, "mse_loss": 0.060842812061309814, "step": 8870 }, { "epoch": 1.052756372258447, "grad_norm": 0.41796875, "learning_rate": 0.00019797310336235508, "loss": 0.8631, "step": 8880 }, { "contrastive_loss": 3.9136962890625, "epoch": 1.052756372258447, "mse_loss": 0.06565424054861069, "step": 8880 }, { "epoch": 1.053941908713693, "grad_norm": 0.49609375, "learning_rate": 0.00019796481451852605, "loss": 0.8594, "step": 8890 }, { "contrastive_loss": 3.947998046875, "epoch": 1.053941908713693, "mse_loss": 0.06932934373617172, "step": 8890 }, { "epoch": 1.055127445168939, "grad_norm": 0.453125, "learning_rate": 0.00019795650893518956, "loss": 0.8788, "step": 8900 }, { "contrastive_loss": 3.9283447265625, "epoch": 1.055127445168939, "mse_loss": 0.06483492255210876, "step": 8900 }, { "epoch": 1.056312981624185, "grad_norm": 0.55078125, "learning_rate": 0.00019794818661376482, "loss": 0.8619, "step": 8910 }, { "contrastive_loss": 4.031494140625, "epoch": 1.056312981624185, "mse_loss": 0.0609988234937191, "step": 8910 }, { "epoch": 1.057498518079431, "grad_norm": 0.416015625, "learning_rate": 0.00019793984755567384, "loss": 0.8574, "step": 8920 }, { "contrastive_loss": 4.0665283203125, "epoch": 1.057498518079431, "mse_loss": 0.08827183395624161, "step": 8920 }, { "epoch": 1.058684054534677, "grad_norm": 0.494140625, "learning_rate": 0.0001979314917623416, "loss": 0.8781, "step": 8930 }, { "contrastive_loss": 4.008544921875, "epoch": 1.058684054534677, "mse_loss": 0.06919556111097336, "step": 8930 }, { "epoch": 1.059869590989923, "grad_norm": 0.55078125, "learning_rate": 0.00019792311923519585, "loss": 0.8717, "step": 8940 }, { "contrastive_loss": 3.923095703125, "epoch": 1.059869590989923, "mse_loss": 0.06794121116399765, "step": 8940 }, { "epoch": 1.061055127445169, "grad_norm": 0.4296875, "learning_rate": 0.00019791472997566722, "loss": 0.8632, "step": 8950 }, { "contrastive_loss": 3.939208984375, "epoch": 1.061055127445169, "mse_loss": 0.0814274474978447, "step": 8950 }, { "epoch": 1.062240663900415, "grad_norm": 0.5625, "learning_rate": 0.00019790632398518923, "loss": 0.8709, "step": 8960 }, { "contrastive_loss": 4.01025390625, "epoch": 1.062240663900415, "mse_loss": 0.10177548974752426, "step": 8960 }, { "epoch": 1.063426200355661, "grad_norm": 0.54296875, "learning_rate": 0.00019789790126519818, "loss": 0.8547, "step": 8970 }, { "contrastive_loss": 3.9544677734375, "epoch": 1.063426200355661, "mse_loss": 0.06780659407377243, "step": 8970 }, { "epoch": 1.064611736810907, "grad_norm": 0.462890625, "learning_rate": 0.00019788946181713334, "loss": 0.8706, "step": 8980 }, { "contrastive_loss": 4.10986328125, "epoch": 1.064611736810907, "mse_loss": 0.06323032081127167, "step": 8980 }, { "epoch": 1.065797273266153, "grad_norm": 0.5078125, "learning_rate": 0.00019788100564243678, "loss": 0.8743, "step": 8990 }, { "contrastive_loss": 3.9852294921875, "epoch": 1.065797273266153, "mse_loss": 0.1051546186208725, "step": 8990 }, { "epoch": 1.066982809721399, "grad_norm": 0.47265625, "learning_rate": 0.00019787253274255337, "loss": 0.8789, "step": 9000 }, { "contrastive_loss": 3.9757080078125, "epoch": 1.066982809721399, "mse_loss": 0.061903417110443115, "step": 9000 }, { "epoch": 1.068168346176645, "grad_norm": 0.49609375, "learning_rate": 0.0001978640431189309, "loss": 0.8679, "step": 9010 }, { "contrastive_loss": 3.9761962890625, "epoch": 1.068168346176645, "mse_loss": 0.08964681625366211, "step": 9010 }, { "epoch": 1.069353882631891, "grad_norm": 0.515625, "learning_rate": 0.0001978555367730201, "loss": 0.8669, "step": 9020 }, { "contrastive_loss": 4.0439453125, "epoch": 1.069353882631891, "mse_loss": 0.07351652532815933, "step": 9020 }, { "epoch": 1.070539419087137, "grad_norm": 0.494140625, "learning_rate": 0.00019784701370627444, "loss": 0.8548, "step": 9030 }, { "contrastive_loss": 3.875244140625, "epoch": 1.070539419087137, "mse_loss": 0.08312033116817474, "step": 9030 }, { "epoch": 1.071724955542383, "grad_norm": 0.408203125, "learning_rate": 0.00019783847392015026, "loss": 0.8563, "step": 9040 }, { "contrastive_loss": 3.934326171875, "epoch": 1.071724955542383, "mse_loss": 0.0652485117316246, "step": 9040 }, { "epoch": 1.072910491997629, "grad_norm": 0.4296875, "learning_rate": 0.0001978299174161067, "loss": 0.8637, "step": 9050 }, { "contrastive_loss": 4.0111083984375, "epoch": 1.072910491997629, "mse_loss": 0.050065845251083374, "step": 9050 }, { "epoch": 1.0740960284528749, "grad_norm": 0.5234375, "learning_rate": 0.00019782134419560595, "loss": 0.857, "step": 9060 }, { "contrastive_loss": 3.979736328125, "epoch": 1.0740960284528749, "mse_loss": 0.09129093587398529, "step": 9060 }, { "epoch": 1.0752815649081209, "grad_norm": 0.58984375, "learning_rate": 0.00019781275426011293, "loss": 0.8567, "step": 9070 }, { "contrastive_loss": 3.9449462890625, "epoch": 1.0752815649081209, "mse_loss": 0.08329880982637405, "step": 9070 }, { "epoch": 1.0764671013633669, "grad_norm": 0.53125, "learning_rate": 0.00019780414761109535, "loss": 0.8589, "step": 9080 }, { "contrastive_loss": 3.946533203125, "epoch": 1.0764671013633669, "mse_loss": 0.05310998111963272, "step": 9080 }, { "epoch": 1.0776526378186129, "grad_norm": 0.3671875, "learning_rate": 0.0001977955242500239, "loss": 0.8543, "step": 9090 }, { "contrastive_loss": 3.9183349609375, "epoch": 1.0776526378186129, "mse_loss": 0.06290769577026367, "step": 9090 }, { "epoch": 1.0788381742738589, "grad_norm": 0.51953125, "learning_rate": 0.0001977868841783721, "loss": 0.8586, "step": 9100 }, { "contrastive_loss": 3.847900390625, "epoch": 1.0788381742738589, "mse_loss": 0.09638501703739166, "step": 9100 }, { "epoch": 1.0800237107291049, "grad_norm": 0.447265625, "learning_rate": 0.00019777822739761624, "loss": 0.8591, "step": 9110 }, { "contrastive_loss": 3.967529296875, "epoch": 1.0800237107291049, "mse_loss": 0.08624906092882156, "step": 9110 }, { "epoch": 1.0812092471843509, "grad_norm": 0.83984375, "learning_rate": 0.00019776955390923555, "loss": 0.8599, "step": 9120 }, { "contrastive_loss": 3.8092041015625, "epoch": 1.0812092471843509, "mse_loss": 0.05354497581720352, "step": 9120 }, { "epoch": 1.0823947836395968, "grad_norm": 0.51171875, "learning_rate": 0.00019776086371471214, "loss": 0.864, "step": 9130 }, { "contrastive_loss": 3.83056640625, "epoch": 1.0823947836395968, "mse_loss": 0.09898357838392258, "step": 9130 }, { "epoch": 1.0835803200948428, "grad_norm": 0.412109375, "learning_rate": 0.00019775215681553084, "loss": 0.8707, "step": 9140 }, { "contrastive_loss": 3.9864501953125, "epoch": 1.0835803200948428, "mse_loss": 0.06168525293469429, "step": 9140 }, { "epoch": 1.0847658565500888, "grad_norm": 0.396484375, "learning_rate": 0.0001977434332131795, "loss": 0.8642, "step": 9150 }, { "contrastive_loss": 3.895263671875, "epoch": 1.0847658565500888, "mse_loss": 0.07881630957126617, "step": 9150 }, { "epoch": 1.0859513930053348, "grad_norm": 0.5, "learning_rate": 0.0001977346929091487, "loss": 0.8698, "step": 9160 }, { "contrastive_loss": 3.9422607421875, "epoch": 1.0859513930053348, "mse_loss": 0.06276098638772964, "step": 9160 }, { "epoch": 1.0871369294605808, "grad_norm": 0.51171875, "learning_rate": 0.00019772593590493194, "loss": 0.87, "step": 9170 }, { "contrastive_loss": 3.876708984375, "epoch": 1.0871369294605808, "mse_loss": 0.09912709891796112, "step": 9170 }, { "epoch": 1.0883224659158268, "grad_norm": 0.515625, "learning_rate": 0.00019771716220202552, "loss": 0.8703, "step": 9180 }, { "contrastive_loss": 4.0076904296875, "epoch": 1.0883224659158268, "mse_loss": 0.08639240264892578, "step": 9180 }, { "epoch": 1.0895080023710728, "grad_norm": 0.765625, "learning_rate": 0.00019770837180192868, "loss": 0.8694, "step": 9190 }, { "contrastive_loss": 3.98779296875, "epoch": 1.0895080023710728, "mse_loss": 0.07268990576267242, "step": 9190 }, { "epoch": 1.0906935388263188, "grad_norm": 0.60546875, "learning_rate": 0.0001976995647061434, "loss": 0.876, "step": 9200 }, { "contrastive_loss": 3.9224853515625, "epoch": 1.0906935388263188, "mse_loss": 0.07778716087341309, "step": 9200 }, { "epoch": 1.091879075281565, "grad_norm": 0.5, "learning_rate": 0.00019769074091617464, "loss": 0.8743, "step": 9210 }, { "contrastive_loss": 3.962158203125, "epoch": 1.091879075281565, "mse_loss": 0.10310284048318863, "step": 9210 }, { "epoch": 1.093064611736811, "grad_norm": 0.5078125, "learning_rate": 0.00019768190043353005, "loss": 0.8697, "step": 9220 }, { "contrastive_loss": 3.8890380859375, "epoch": 1.093064611736811, "mse_loss": 0.08942709118127823, "step": 9220 }, { "epoch": 1.094250148192057, "grad_norm": 0.4453125, "learning_rate": 0.00019767304325972034, "loss": 0.8625, "step": 9230 }, { "contrastive_loss": 4.0179443359375, "epoch": 1.094250148192057, "mse_loss": 0.0669834166765213, "step": 9230 }, { "epoch": 1.095435684647303, "grad_norm": 0.62109375, "learning_rate": 0.00019766416939625886, "loss": 0.8622, "step": 9240 }, { "contrastive_loss": 3.9520263671875, "epoch": 1.095435684647303, "mse_loss": 0.06712881475687027, "step": 9240 }, { "epoch": 1.096621221102549, "grad_norm": 0.4453125, "learning_rate": 0.00019765527884466196, "loss": 0.8761, "step": 9250 }, { "contrastive_loss": 4.0595703125, "epoch": 1.096621221102549, "mse_loss": 0.07299090921878815, "step": 9250 }, { "epoch": 1.097806757557795, "grad_norm": 0.34375, "learning_rate": 0.00019764637160644882, "loss": 0.8593, "step": 9260 }, { "contrastive_loss": 4.1580810546875, "epoch": 1.097806757557795, "mse_loss": 0.0881153866648674, "step": 9260 }, { "epoch": 1.098992294013041, "grad_norm": 0.482421875, "learning_rate": 0.00019763744768314134, "loss": 0.867, "step": 9270 }, { "contrastive_loss": 3.9298095703125, "epoch": 1.098992294013041, "mse_loss": 0.05513034015893936, "step": 9270 }, { "epoch": 1.100177830468287, "grad_norm": 0.50390625, "learning_rate": 0.0001976285070762645, "loss": 0.8555, "step": 9280 }, { "contrastive_loss": 4.00634765625, "epoch": 1.100177830468287, "mse_loss": 0.09224486351013184, "step": 9280 }, { "epoch": 1.101363366923533, "grad_norm": 0.5, "learning_rate": 0.00019761954978734592, "loss": 0.8661, "step": 9290 }, { "contrastive_loss": 3.9283447265625, "epoch": 1.101363366923533, "mse_loss": 0.07812736928462982, "step": 9290 }, { "epoch": 1.102548903378779, "grad_norm": 0.474609375, "learning_rate": 0.0001976105758179162, "loss": 0.8638, "step": 9300 }, { "contrastive_loss": 3.857421875, "epoch": 1.102548903378779, "mse_loss": 0.07832378149032593, "step": 9300 }, { "epoch": 1.103734439834025, "grad_norm": 0.48046875, "learning_rate": 0.00019760158516950868, "loss": 0.8729, "step": 9310 }, { "contrastive_loss": 3.8914794921875, "epoch": 1.103734439834025, "mse_loss": 0.09383363276720047, "step": 9310 }, { "epoch": 1.104919976289271, "grad_norm": 0.435546875, "learning_rate": 0.0001975925778436597, "loss": 0.8668, "step": 9320 }, { "contrastive_loss": 3.8406982421875, "epoch": 1.104919976289271, "mse_loss": 0.07364105433225632, "step": 9320 }, { "epoch": 1.106105512744517, "grad_norm": 0.412109375, "learning_rate": 0.00019758355384190832, "loss": 0.8548, "step": 9330 }, { "contrastive_loss": 3.81787109375, "epoch": 1.106105512744517, "mse_loss": 0.07221700996160507, "step": 9330 }, { "epoch": 1.107291049199763, "grad_norm": 0.78125, "learning_rate": 0.0001975745131657965, "loss": 0.8737, "step": 9340 }, { "contrastive_loss": 3.8194580078125, "epoch": 1.107291049199763, "mse_loss": 0.08374866098165512, "step": 9340 }, { "epoch": 1.108476585655009, "grad_norm": 0.53125, "learning_rate": 0.00019756545581686908, "loss": 0.8631, "step": 9350 }, { "contrastive_loss": 3.967529296875, "epoch": 1.108476585655009, "mse_loss": 0.07167395204305649, "step": 9350 }, { "epoch": 1.109662122110255, "grad_norm": 0.55078125, "learning_rate": 0.00019755638179667364, "loss": 0.8697, "step": 9360 }, { "contrastive_loss": 3.921875, "epoch": 1.109662122110255, "mse_loss": 0.08363322913646698, "step": 9360 }, { "epoch": 1.110847658565501, "grad_norm": 0.53515625, "learning_rate": 0.00019754729110676075, "loss": 0.8634, "step": 9370 }, { "contrastive_loss": 4.0596923828125, "epoch": 1.110847658565501, "mse_loss": 0.08625786751508713, "step": 9370 }, { "epoch": 1.112033195020747, "grad_norm": 0.5546875, "learning_rate": 0.00019753818374868373, "loss": 0.8729, "step": 9380 }, { "contrastive_loss": 4.0391845703125, "epoch": 1.112033195020747, "mse_loss": 0.06321946531534195, "step": 9380 }, { "epoch": 1.113218731475993, "grad_norm": 0.466796875, "learning_rate": 0.00019752905972399878, "loss": 0.8649, "step": 9390 }, { "contrastive_loss": 3.826171875, "epoch": 1.113218731475993, "mse_loss": 0.08010145276784897, "step": 9390 }, { "epoch": 1.114404267931239, "grad_norm": 0.486328125, "learning_rate": 0.00019751991903426495, "loss": 0.8489, "step": 9400 }, { "contrastive_loss": 3.9385986328125, "epoch": 1.114404267931239, "mse_loss": 0.06877348572015762, "step": 9400 }, { "epoch": 1.115589804386485, "grad_norm": 0.49609375, "learning_rate": 0.00019751076168104414, "loss": 0.864, "step": 9410 }, { "contrastive_loss": 3.9093017578125, "epoch": 1.115589804386485, "mse_loss": 0.11837724596261978, "step": 9410 }, { "epoch": 1.116775340841731, "grad_norm": 0.65234375, "learning_rate": 0.00019750158766590107, "loss": 0.8721, "step": 9420 }, { "contrastive_loss": 3.9447021484375, "epoch": 1.116775340841731, "mse_loss": 0.08067517727613449, "step": 9420 }, { "epoch": 1.117960877296977, "grad_norm": 0.64453125, "learning_rate": 0.00019749239699040335, "loss": 0.8637, "step": 9430 }, { "contrastive_loss": 4.030517578125, "epoch": 1.117960877296977, "mse_loss": 0.06876630336046219, "step": 9430 }, { "epoch": 1.119146413752223, "grad_norm": 0.53125, "learning_rate": 0.00019748318965612138, "loss": 0.8772, "step": 9440 }, { "contrastive_loss": 3.8358154296875, "epoch": 1.119146413752223, "mse_loss": 0.06755845993757248, "step": 9440 }, { "epoch": 1.120331950207469, "grad_norm": 0.5234375, "learning_rate": 0.0001974739656646285, "loss": 0.8572, "step": 9450 }, { "contrastive_loss": 4.0103759765625, "epoch": 1.120331950207469, "mse_loss": 0.05699676275253296, "step": 9450 }, { "epoch": 1.121517486662715, "grad_norm": 0.69140625, "learning_rate": 0.0001974647250175008, "loss": 0.8655, "step": 9460 }, { "contrastive_loss": 4.0224609375, "epoch": 1.121517486662715, "mse_loss": 0.08045870810747147, "step": 9460 }, { "epoch": 1.1227030231179609, "grad_norm": 0.51171875, "learning_rate": 0.00019745546771631725, "loss": 0.8696, "step": 9470 }, { "contrastive_loss": 3.8179931640625, "epoch": 1.1227030231179609, "mse_loss": 0.07328999042510986, "step": 9470 }, { "epoch": 1.1238885595732069, "grad_norm": 0.439453125, "learning_rate": 0.00019744619376265972, "loss": 0.8643, "step": 9480 }, { "contrastive_loss": 3.94775390625, "epoch": 1.1238885595732069, "mse_loss": 0.06027641519904137, "step": 9480 }, { "epoch": 1.1250740960284529, "grad_norm": 0.62890625, "learning_rate": 0.00019743690315811278, "loss": 0.8664, "step": 9490 }, { "contrastive_loss": 3.88818359375, "epoch": 1.1250740960284529, "mse_loss": 0.0668400451540947, "step": 9490 }, { "epoch": 1.1262596324836989, "grad_norm": 0.55859375, "learning_rate": 0.00019742759590426402, "loss": 0.8667, "step": 9500 }, { "contrastive_loss": 3.9678955078125, "epoch": 1.1262596324836989, "mse_loss": 0.07877247780561447, "step": 9500 }, { "epoch": 1.1274451689389449, "grad_norm": 0.376953125, "learning_rate": 0.0001974182720027038, "loss": 0.8755, "step": 9510 }, { "contrastive_loss": 3.9603271484375, "epoch": 1.1274451689389449, "mse_loss": 0.11377500742673874, "step": 9510 }, { "epoch": 1.1286307053941909, "grad_norm": 0.427734375, "learning_rate": 0.00019740893145502524, "loss": 0.8724, "step": 9520 }, { "contrastive_loss": 3.96923828125, "epoch": 1.1286307053941909, "mse_loss": 0.07901100069284439, "step": 9520 }, { "epoch": 1.1298162418494369, "grad_norm": 0.50390625, "learning_rate": 0.00019739957426282448, "loss": 0.8688, "step": 9530 }, { "contrastive_loss": 3.8804931640625, "epoch": 1.1298162418494369, "mse_loss": 0.053156811743974686, "step": 9530 }, { "epoch": 1.1310017783046828, "grad_norm": 0.61328125, "learning_rate": 0.00019739020042770032, "loss": 0.8676, "step": 9540 }, { "contrastive_loss": 3.85791015625, "epoch": 1.1310017783046828, "mse_loss": 0.10695886611938477, "step": 9540 }, { "epoch": 1.1321873147599288, "grad_norm": 0.6171875, "learning_rate": 0.00019738080995125454, "loss": 0.8677, "step": 9550 }, { "contrastive_loss": 3.9688720703125, "epoch": 1.1321873147599288, "mse_loss": 0.06355512142181396, "step": 9550 }, { "epoch": 1.1333728512151748, "grad_norm": 0.44140625, "learning_rate": 0.00019737140283509173, "loss": 0.8705, "step": 9560 }, { "contrastive_loss": 3.829345703125, "epoch": 1.1333728512151748, "mse_loss": 0.07314269244670868, "step": 9560 }, { "epoch": 1.1345583876704208, "grad_norm": 0.57421875, "learning_rate": 0.0001973619790808193, "loss": 0.8642, "step": 9570 }, { "contrastive_loss": 4.01904296875, "epoch": 1.1345583876704208, "mse_loss": 0.06910908967256546, "step": 9570 }, { "epoch": 1.1357439241256668, "grad_norm": 0.416015625, "learning_rate": 0.0001973525386900475, "loss": 0.8673, "step": 9580 }, { "contrastive_loss": 4.08544921875, "epoch": 1.1357439241256668, "mse_loss": 0.08239389955997467, "step": 9580 }, { "epoch": 1.1369294605809128, "grad_norm": 0.46484375, "learning_rate": 0.0001973430816643894, "loss": 0.8584, "step": 9590 }, { "contrastive_loss": 4.0220947265625, "epoch": 1.1369294605809128, "mse_loss": 0.11347369849681854, "step": 9590 }, { "epoch": 1.1381149970361588, "grad_norm": 0.458984375, "learning_rate": 0.000197333608005461, "loss": 0.8721, "step": 9600 }, { "contrastive_loss": 3.94873046875, "epoch": 1.1381149970361588, "mse_loss": 0.060229089111089706, "step": 9600 }, { "epoch": 1.1393005334914048, "grad_norm": 0.58984375, "learning_rate": 0.00019732411771488105, "loss": 0.8681, "step": 9610 }, { "contrastive_loss": 3.968505859375, "epoch": 1.1393005334914048, "mse_loss": 0.06834784895181656, "step": 9610 }, { "epoch": 1.1404860699466508, "grad_norm": 0.435546875, "learning_rate": 0.00019731461079427126, "loss": 0.862, "step": 9620 }, { "contrastive_loss": 3.959716796875, "epoch": 1.1404860699466508, "mse_loss": 0.10072461515665054, "step": 9620 }, { "epoch": 1.1416716064018968, "grad_norm": 0.5234375, "learning_rate": 0.000197305087245256, "loss": 0.8601, "step": 9630 }, { "contrastive_loss": 3.927734375, "epoch": 1.1416716064018968, "mse_loss": 0.07434437423944473, "step": 9630 }, { "epoch": 1.1428571428571428, "grad_norm": 0.51953125, "learning_rate": 0.00019729554706946265, "loss": 0.8626, "step": 9640 }, { "contrastive_loss": 3.8779296875, "epoch": 1.1428571428571428, "mse_loss": 0.0580415204167366, "step": 9640 }, { "epoch": 1.1440426793123888, "grad_norm": 0.59765625, "learning_rate": 0.00019728599026852135, "loss": 0.8613, "step": 9650 }, { "contrastive_loss": 3.9447021484375, "epoch": 1.1440426793123888, "mse_loss": 0.05742090195417404, "step": 9650 }, { "epoch": 1.1452282157676348, "grad_norm": 0.5625, "learning_rate": 0.00019727641684406507, "loss": 0.8542, "step": 9660 }, { "contrastive_loss": 4.0096435546875, "epoch": 1.1452282157676348, "mse_loss": 0.06259285658597946, "step": 9660 }, { "epoch": 1.1464137522228808, "grad_norm": 0.6640625, "learning_rate": 0.00019726682679772965, "loss": 0.8686, "step": 9670 }, { "contrastive_loss": 3.925048828125, "epoch": 1.1464137522228808, "mse_loss": 0.07423656433820724, "step": 9670 }, { "epoch": 1.1475992886781268, "grad_norm": 0.451171875, "learning_rate": 0.0001972572201311538, "loss": 0.8683, "step": 9680 }, { "contrastive_loss": 3.89013671875, "epoch": 1.1475992886781268, "mse_loss": 0.06339267641305923, "step": 9680 }, { "epoch": 1.1487848251333728, "grad_norm": 0.447265625, "learning_rate": 0.00019724759684597906, "loss": 0.8604, "step": 9690 }, { "contrastive_loss": 3.9129638671875, "epoch": 1.1487848251333728, "mse_loss": 0.08840388804674149, "step": 9690 }, { "epoch": 1.1499703615886188, "grad_norm": 0.5, "learning_rate": 0.0001972379569438497, "loss": 0.8733, "step": 9700 }, { "contrastive_loss": 4.086181640625, "epoch": 1.1499703615886188, "mse_loss": 0.089033342897892, "step": 9700 }, { "epoch": 1.1511558980438648, "grad_norm": 0.353515625, "learning_rate": 0.000197228300426413, "loss": 0.8715, "step": 9710 }, { "contrastive_loss": 3.974365234375, "epoch": 1.1511558980438648, "mse_loss": 0.1077410951256752, "step": 9710 }, { "epoch": 1.1523414344991108, "grad_norm": 0.55078125, "learning_rate": 0.00019721862729531891, "loss": 0.8721, "step": 9720 }, { "contrastive_loss": 3.8897705078125, "epoch": 1.1523414344991108, "mse_loss": 0.07769681513309479, "step": 9720 }, { "epoch": 1.1535269709543567, "grad_norm": 0.40625, "learning_rate": 0.00019720893755222042, "loss": 0.8665, "step": 9730 }, { "contrastive_loss": 3.9735107421875, "epoch": 1.1535269709543567, "mse_loss": 0.0795193761587143, "step": 9730 }, { "epoch": 1.1547125074096027, "grad_norm": 0.404296875, "learning_rate": 0.0001971992311987731, "loss": 0.8565, "step": 9740 }, { "contrastive_loss": 3.961181640625, "epoch": 1.1547125074096027, "mse_loss": 0.06523869931697845, "step": 9740 }, { "epoch": 1.1558980438648487, "grad_norm": 0.4375, "learning_rate": 0.0001971895082366356, "loss": 0.8639, "step": 9750 }, { "contrastive_loss": 3.997314453125, "epoch": 1.1558980438648487, "mse_loss": 0.07033234089612961, "step": 9750 }, { "epoch": 1.1570835803200947, "grad_norm": 0.44140625, "learning_rate": 0.00019717976866746927, "loss": 0.8646, "step": 9760 }, { "contrastive_loss": 4.0447998046875, "epoch": 1.1570835803200947, "mse_loss": 0.06681958585977554, "step": 9760 }, { "epoch": 1.1582691167753407, "grad_norm": 0.435546875, "learning_rate": 0.00019717001249293836, "loss": 0.8632, "step": 9770 }, { "contrastive_loss": 3.98974609375, "epoch": 1.1582691167753407, "mse_loss": 0.1103617325425148, "step": 9770 }, { "epoch": 1.1594546532305867, "grad_norm": 0.482421875, "learning_rate": 0.00019716023971470993, "loss": 0.872, "step": 9780 }, { "contrastive_loss": 3.9647216796875, "epoch": 1.1594546532305867, "mse_loss": 0.07781173288822174, "step": 9780 }, { "epoch": 1.160640189685833, "grad_norm": 0.400390625, "learning_rate": 0.00019715045033445386, "loss": 0.8614, "step": 9790 }, { "contrastive_loss": 3.9156494140625, "epoch": 1.160640189685833, "mse_loss": 0.06770938634872437, "step": 9790 }, { "epoch": 1.161825726141079, "grad_norm": 0.5859375, "learning_rate": 0.0001971406443538429, "loss": 0.8577, "step": 9800 }, { "contrastive_loss": 3.8167724609375, "epoch": 1.161825726141079, "mse_loss": 0.09080253541469574, "step": 9800 }, { "epoch": 1.163011262596325, "grad_norm": 0.458984375, "learning_rate": 0.00019713082177455263, "loss": 0.8446, "step": 9810 }, { "contrastive_loss": 3.9124755859375, "epoch": 1.163011262596325, "mse_loss": 0.0783456563949585, "step": 9810 }, { "epoch": 1.164196799051571, "grad_norm": 0.439453125, "learning_rate": 0.00019712098259826145, "loss": 0.8576, "step": 9820 }, { "contrastive_loss": 3.943115234375, "epoch": 1.164196799051571, "mse_loss": 0.09961448609828949, "step": 9820 }, { "epoch": 1.165382335506817, "grad_norm": 0.5, "learning_rate": 0.0001971111268266506, "loss": 0.8758, "step": 9830 }, { "contrastive_loss": 3.931640625, "epoch": 1.165382335506817, "mse_loss": 0.06059694290161133, "step": 9830 }, { "epoch": 1.166567871962063, "grad_norm": 0.447265625, "learning_rate": 0.00019710125446140416, "loss": 0.8657, "step": 9840 }, { "contrastive_loss": 4.0406494140625, "epoch": 1.166567871962063, "mse_loss": 0.05418676882982254, "step": 9840 }, { "epoch": 1.167753408417309, "grad_norm": 0.494140625, "learning_rate": 0.00019709136550420908, "loss": 0.8726, "step": 9850 }, { "contrastive_loss": 3.942138671875, "epoch": 1.167753408417309, "mse_loss": 0.09361178427934647, "step": 9850 }, { "epoch": 1.168938944872555, "grad_norm": 0.6015625, "learning_rate": 0.00019708145995675508, "loss": 0.8678, "step": 9860 }, { "contrastive_loss": 3.921630859375, "epoch": 1.168938944872555, "mse_loss": 0.054911017417907715, "step": 9860 }, { "epoch": 1.170124481327801, "grad_norm": 0.4921875, "learning_rate": 0.00019707153782073475, "loss": 0.8631, "step": 9870 }, { "contrastive_loss": 3.9310302734375, "epoch": 1.170124481327801, "mse_loss": 0.06703201681375504, "step": 9870 }, { "epoch": 1.1713100177830469, "grad_norm": 0.427734375, "learning_rate": 0.00019706159909784355, "loss": 0.8504, "step": 9880 }, { "contrastive_loss": 3.8985595703125, "epoch": 1.1713100177830469, "mse_loss": 0.10117337852716446, "step": 9880 }, { "epoch": 1.1724955542382929, "grad_norm": 0.458984375, "learning_rate": 0.00019705164378977966, "loss": 0.8686, "step": 9890 }, { "contrastive_loss": 3.8226318359375, "epoch": 1.1724955542382929, "mse_loss": 0.07028210908174515, "step": 9890 }, { "epoch": 1.1736810906935389, "grad_norm": 0.53125, "learning_rate": 0.00019704167189824425, "loss": 0.8623, "step": 9900 }, { "contrastive_loss": 3.947998046875, "epoch": 1.1736810906935389, "mse_loss": 0.057774655520915985, "step": 9900 }, { "epoch": 1.1748666271487849, "grad_norm": 0.49609375, "learning_rate": 0.00019703168342494117, "loss": 0.8595, "step": 9910 }, { "contrastive_loss": 4.0489501953125, "epoch": 1.1748666271487849, "mse_loss": 0.09807863086462021, "step": 9910 }, { "epoch": 1.1760521636040309, "grad_norm": 0.478515625, "learning_rate": 0.00019702167837157725, "loss": 0.8718, "step": 9920 }, { "contrastive_loss": 4.001708984375, "epoch": 1.1760521636040309, "mse_loss": 0.06757157295942307, "step": 9920 }, { "epoch": 1.1772377000592769, "grad_norm": 0.53125, "learning_rate": 0.00019701165673986207, "loss": 0.8559, "step": 9930 }, { "contrastive_loss": 3.9053955078125, "epoch": 1.1772377000592769, "mse_loss": 0.09093797206878662, "step": 9930 }, { "epoch": 1.1784232365145229, "grad_norm": 0.478515625, "learning_rate": 0.00019700161853150795, "loss": 0.8702, "step": 9940 }, { "contrastive_loss": 3.950439453125, "epoch": 1.1784232365145229, "mse_loss": 0.07059450447559357, "step": 9940 }, { "epoch": 1.1796087729697688, "grad_norm": 0.56640625, "learning_rate": 0.0001969915637482303, "loss": 0.8665, "step": 9950 }, { "contrastive_loss": 3.88720703125, "epoch": 1.1796087729697688, "mse_loss": 0.07978158444166183, "step": 9950 }, { "epoch": 1.1807943094250148, "grad_norm": 0.6171875, "learning_rate": 0.00019698149239174708, "loss": 0.8607, "step": 9960 }, { "contrastive_loss": 3.834228515625, "epoch": 1.1807943094250148, "mse_loss": 0.05833267420530319, "step": 9960 }, { "epoch": 1.1819798458802608, "grad_norm": 0.52734375, "learning_rate": 0.00019697140446377928, "loss": 0.8666, "step": 9970 }, { "contrastive_loss": 3.8280029296875, "epoch": 1.1819798458802608, "mse_loss": 0.06952390819787979, "step": 9970 }, { "epoch": 1.1831653823355068, "grad_norm": 0.515625, "learning_rate": 0.00019696129996605062, "loss": 0.8472, "step": 9980 }, { "contrastive_loss": 4.033203125, "epoch": 1.1831653823355068, "mse_loss": 0.09965918958187103, "step": 9980 }, { "epoch": 1.1843509187907528, "grad_norm": 0.478515625, "learning_rate": 0.0001969511789002877, "loss": 0.8637, "step": 9990 }, { "contrastive_loss": 3.9669189453125, "epoch": 1.1843509187907528, "mse_loss": 0.06630059331655502, "step": 9990 }, { "epoch": 1.1855364552459988, "grad_norm": 0.453125, "learning_rate": 0.00019694104126821992, "loss": 0.8645, "step": 10000 }, { "contrastive_loss": 3.852294921875, "epoch": 1.1855364552459988, "mse_loss": 0.06723321229219437, "step": 10000 }, { "epoch": 1.1867219917012448, "grad_norm": 0.55078125, "learning_rate": 0.00019693088707157955, "loss": 0.8687, "step": 10010 }, { "contrastive_loss": 3.9278564453125, "epoch": 1.1867219917012448, "mse_loss": 0.06200822815299034, "step": 10010 }, { "epoch": 1.1879075281564908, "grad_norm": 0.51953125, "learning_rate": 0.00019692071631210163, "loss": 0.8596, "step": 10020 }, { "contrastive_loss": 3.9534912109375, "epoch": 1.1879075281564908, "mse_loss": 0.05843154713511467, "step": 10020 }, { "epoch": 1.1890930646117368, "grad_norm": 0.451171875, "learning_rate": 0.00019691052899152407, "loss": 0.8583, "step": 10030 }, { "contrastive_loss": 3.880859375, "epoch": 1.1890930646117368, "mse_loss": 0.0866873636841774, "step": 10030 }, { "epoch": 1.1902786010669828, "grad_norm": 0.47265625, "learning_rate": 0.00019690032511158765, "loss": 0.8601, "step": 10040 }, { "contrastive_loss": 3.9481201171875, "epoch": 1.1902786010669828, "mse_loss": 0.0672541931271553, "step": 10040 }, { "epoch": 1.1914641375222288, "grad_norm": 0.484375, "learning_rate": 0.00019689010467403587, "loss": 0.8623, "step": 10050 }, { "contrastive_loss": 4.0579833984375, "epoch": 1.1914641375222288, "mse_loss": 0.0956583172082901, "step": 10050 }, { "epoch": 1.1926496739774748, "grad_norm": 0.5859375, "learning_rate": 0.00019687986768061514, "loss": 0.866, "step": 10060 }, { "contrastive_loss": 4.0186767578125, "epoch": 1.1926496739774748, "mse_loss": 0.06326662749052048, "step": 10060 }, { "epoch": 1.1938352104327208, "grad_norm": 0.5625, "learning_rate": 0.00019686961413307473, "loss": 0.8526, "step": 10070 }, { "contrastive_loss": 3.879638671875, "epoch": 1.1938352104327208, "mse_loss": 0.09468957036733627, "step": 10070 }, { "epoch": 1.1950207468879668, "grad_norm": 0.4296875, "learning_rate": 0.0001968593440331666, "loss": 0.8638, "step": 10080 }, { "contrastive_loss": 3.9552001953125, "epoch": 1.1950207468879668, "mse_loss": 0.06441505253314972, "step": 10080 }, { "epoch": 1.1962062833432128, "grad_norm": 0.408203125, "learning_rate": 0.00019684905738264573, "loss": 0.8551, "step": 10090 }, { "contrastive_loss": 3.9361572265625, "epoch": 1.1962062833432128, "mse_loss": 0.061374109238386154, "step": 10090 }, { "epoch": 1.1973918197984588, "grad_norm": 0.451171875, "learning_rate": 0.00019683875418326978, "loss": 0.8651, "step": 10100 }, { "contrastive_loss": 3.8355712890625, "epoch": 1.1973918197984588, "mse_loss": 0.058961328119039536, "step": 10100 }, { "epoch": 1.1985773562537048, "grad_norm": 0.486328125, "learning_rate": 0.00019682843443679925, "loss": 0.8622, "step": 10110 }, { "contrastive_loss": 3.9822998046875, "epoch": 1.1985773562537048, "mse_loss": 0.06407319009304047, "step": 10110 }, { "epoch": 1.1997628927089508, "grad_norm": 0.419921875, "learning_rate": 0.00019681809814499758, "loss": 0.8592, "step": 10120 }, { "contrastive_loss": 4.0816650390625, "epoch": 1.1997628927089508, "mse_loss": 0.059373706579208374, "step": 10120 }, { "epoch": 1.2009484291641968, "grad_norm": 0.48828125, "learning_rate": 0.0001968077453096309, "loss": 0.8565, "step": 10130 }, { "contrastive_loss": 3.8001708984375, "epoch": 1.2009484291641968, "mse_loss": 0.07582296431064606, "step": 10130 }, { "epoch": 1.2021339656194427, "grad_norm": 0.482421875, "learning_rate": 0.00019679737593246823, "loss": 0.8571, "step": 10140 }, { "contrastive_loss": 3.9935302734375, "epoch": 1.2021339656194427, "mse_loss": 0.09069248288869858, "step": 10140 }, { "epoch": 1.2033195020746887, "grad_norm": 0.51171875, "learning_rate": 0.00019678699001528143, "loss": 0.8711, "step": 10150 }, { "contrastive_loss": 4.0087890625, "epoch": 1.2033195020746887, "mse_loss": 0.07643420249223709, "step": 10150 }, { "epoch": 1.2045050385299347, "grad_norm": 0.416015625, "learning_rate": 0.0001967765875598452, "loss": 0.8504, "step": 10160 }, { "contrastive_loss": 3.9188232421875, "epoch": 1.2045050385299347, "mse_loss": 0.0735216811299324, "step": 10160 }, { "epoch": 1.2056905749851807, "grad_norm": 0.60546875, "learning_rate": 0.00019676616856793697, "loss": 0.8627, "step": 10170 }, { "contrastive_loss": 3.88330078125, "epoch": 1.2056905749851807, "mse_loss": 0.08205975592136383, "step": 10170 }, { "epoch": 1.2068761114404267, "grad_norm": 0.546875, "learning_rate": 0.00019675573304133709, "loss": 0.8667, "step": 10180 }, { "contrastive_loss": 3.866455078125, "epoch": 1.2068761114404267, "mse_loss": 0.10390738397836685, "step": 10180 }, { "epoch": 1.2080616478956727, "grad_norm": 0.58203125, "learning_rate": 0.00019674528098182875, "loss": 0.8681, "step": 10190 }, { "contrastive_loss": 3.903564453125, "epoch": 1.2080616478956727, "mse_loss": 0.08018187433481216, "step": 10190 }, { "epoch": 1.2092471843509187, "grad_norm": 0.484375, "learning_rate": 0.00019673481239119786, "loss": 0.8567, "step": 10200 }, { "contrastive_loss": 3.8294677734375, "epoch": 1.2092471843509187, "mse_loss": 0.0756526067852974, "step": 10200 }, { "epoch": 1.2104327208061647, "grad_norm": 0.44921875, "learning_rate": 0.00019672432727123318, "loss": 0.8621, "step": 10210 }, { "contrastive_loss": 3.8665771484375, "epoch": 1.2104327208061647, "mse_loss": 0.0712173730134964, "step": 10210 }, { "epoch": 1.2116182572614107, "grad_norm": 0.44140625, "learning_rate": 0.00019671382562372645, "loss": 0.8517, "step": 10220 }, { "contrastive_loss": 3.9561767578125, "epoch": 1.2116182572614107, "mse_loss": 0.09817253053188324, "step": 10220 }, { "epoch": 1.2128037937166567, "grad_norm": 0.5625, "learning_rate": 0.000196703307450472, "loss": 0.8558, "step": 10230 }, { "contrastive_loss": 3.833984375, "epoch": 1.2128037937166567, "mse_loss": 0.0752829760313034, "step": 10230 }, { "epoch": 1.2139893301719027, "grad_norm": 0.494140625, "learning_rate": 0.0001966927727532672, "loss": 0.8487, "step": 10240 }, { "contrastive_loss": 4.0174560546875, "epoch": 1.2139893301719027, "mse_loss": 0.09386294335126877, "step": 10240 }, { "epoch": 1.215174866627149, "grad_norm": 0.56640625, "learning_rate": 0.00019668222153391204, "loss": 0.8663, "step": 10250 }, { "contrastive_loss": 3.912109375, "epoch": 1.215174866627149, "mse_loss": 0.060148414224386215, "step": 10250 }, { "epoch": 1.216360403082395, "grad_norm": 0.423828125, "learning_rate": 0.00019667165379420954, "loss": 0.8603, "step": 10260 }, { "contrastive_loss": 3.83251953125, "epoch": 1.216360403082395, "mse_loss": 0.10369767248630524, "step": 10260 }, { "epoch": 1.217545939537641, "grad_norm": 0.57421875, "learning_rate": 0.00019666106953596536, "loss": 0.86, "step": 10270 }, { "contrastive_loss": 3.8900146484375, "epoch": 1.217545939537641, "mse_loss": 0.0707135796546936, "step": 10270 }, { "epoch": 1.218731475992887, "grad_norm": 0.61328125, "learning_rate": 0.00019665046876098807, "loss": 0.8676, "step": 10280 }, { "contrastive_loss": 3.892333984375, "epoch": 1.218731475992887, "mse_loss": 0.08786596357822418, "step": 10280 }, { "epoch": 1.2199170124481329, "grad_norm": 0.5078125, "learning_rate": 0.00019663985147108908, "loss": 0.859, "step": 10290 }, { "contrastive_loss": 3.8228759765625, "epoch": 1.2199170124481329, "mse_loss": 0.09153902530670166, "step": 10290 }, { "epoch": 1.2211025489033789, "grad_norm": 0.55078125, "learning_rate": 0.00019662921766808256, "loss": 0.8645, "step": 10300 }, { "contrastive_loss": 3.90234375, "epoch": 1.2211025489033789, "mse_loss": 0.05634723976254463, "step": 10300 }, { "epoch": 1.2222880853586249, "grad_norm": 0.486328125, "learning_rate": 0.00019661856735378555, "loss": 0.8594, "step": 10310 }, { "contrastive_loss": 3.8857421875, "epoch": 1.2222880853586249, "mse_loss": 0.056584298610687256, "step": 10310 }, { "epoch": 1.2234736218138709, "grad_norm": 0.453125, "learning_rate": 0.00019660790053001792, "loss": 0.8566, "step": 10320 }, { "contrastive_loss": 3.9775390625, "epoch": 1.2234736218138709, "mse_loss": 0.07482162863016129, "step": 10320 }, { "epoch": 1.2246591582691169, "grad_norm": 0.39453125, "learning_rate": 0.0001965972171986023, "loss": 0.8592, "step": 10330 }, { "contrastive_loss": 3.954833984375, "epoch": 1.2246591582691169, "mse_loss": 0.07475212961435318, "step": 10330 }, { "epoch": 1.2258446947243629, "grad_norm": 0.625, "learning_rate": 0.00019658651736136423, "loss": 0.866, "step": 10340 }, { "contrastive_loss": 3.931396484375, "epoch": 1.2258446947243629, "mse_loss": 0.04863797873258591, "step": 10340 }, { "epoch": 1.2270302311796089, "grad_norm": 0.578125, "learning_rate": 0.000196575801020132, "loss": 0.8723, "step": 10350 }, { "contrastive_loss": 3.98193359375, "epoch": 1.2270302311796089, "mse_loss": 0.08562777191400528, "step": 10350 }, { "epoch": 1.2282157676348548, "grad_norm": 0.59375, "learning_rate": 0.0001965650681767367, "loss": 0.8639, "step": 10360 }, { "contrastive_loss": 3.8526611328125, "epoch": 1.2282157676348548, "mse_loss": 0.07610879838466644, "step": 10360 }, { "epoch": 1.2294013040901008, "grad_norm": 0.61328125, "learning_rate": 0.0001965543188330123, "loss": 0.8743, "step": 10370 }, { "contrastive_loss": 3.852783203125, "epoch": 1.2294013040901008, "mse_loss": 0.07065240293741226, "step": 10370 }, { "epoch": 1.2305868405453468, "grad_norm": 0.51953125, "learning_rate": 0.0001965435529907956, "loss": 0.8518, "step": 10380 }, { "contrastive_loss": 3.9415283203125, "epoch": 1.2305868405453468, "mse_loss": 0.08463016897439957, "step": 10380 }, { "epoch": 1.2317723770005928, "grad_norm": 0.486328125, "learning_rate": 0.00019653277065192617, "loss": 0.862, "step": 10390 }, { "contrastive_loss": 3.9814453125, "epoch": 1.2317723770005928, "mse_loss": 0.048170242458581924, "step": 10390 }, { "epoch": 1.2329579134558388, "grad_norm": 0.47265625, "learning_rate": 0.0001965219718182464, "loss": 0.8474, "step": 10400 }, { "contrastive_loss": 3.974609375, "epoch": 1.2329579134558388, "mse_loss": 0.07898871600627899, "step": 10400 }, { "epoch": 1.2341434499110848, "grad_norm": 0.3515625, "learning_rate": 0.0001965111564916015, "loss": 0.8622, "step": 10410 }, { "contrastive_loss": 3.8868408203125, "epoch": 1.2341434499110848, "mse_loss": 0.086009182035923, "step": 10410 }, { "epoch": 1.2353289863663308, "grad_norm": 0.357421875, "learning_rate": 0.0001965003246738396, "loss": 0.867, "step": 10420 }, { "contrastive_loss": 3.9422607421875, "epoch": 1.2353289863663308, "mse_loss": 0.06549055874347687, "step": 10420 }, { "epoch": 1.2365145228215768, "grad_norm": 0.57421875, "learning_rate": 0.00019648947636681147, "loss": 0.8504, "step": 10430 }, { "contrastive_loss": 3.9627685546875, "epoch": 1.2365145228215768, "mse_loss": 0.07638484984636307, "step": 10430 }, { "epoch": 1.2377000592768228, "grad_norm": 0.396484375, "learning_rate": 0.00019647861157237083, "loss": 0.8579, "step": 10440 }, { "contrastive_loss": 3.9781494140625, "epoch": 1.2377000592768228, "mse_loss": 0.09584438800811768, "step": 10440 }, { "epoch": 1.2388855957320688, "grad_norm": 0.44140625, "learning_rate": 0.00019646773029237418, "loss": 0.8635, "step": 10450 }, { "contrastive_loss": 4.025390625, "epoch": 1.2388855957320688, "mse_loss": 0.06907825171947479, "step": 10450 }, { "epoch": 1.2400711321873148, "grad_norm": 0.37109375, "learning_rate": 0.0001964568325286808, "loss": 0.8652, "step": 10460 }, { "contrastive_loss": 3.9420166015625, "epoch": 1.2400711321873148, "mse_loss": 0.06163986399769783, "step": 10460 }, { "epoch": 1.2412566686425608, "grad_norm": 0.37890625, "learning_rate": 0.00019644591828315284, "loss": 0.8576, "step": 10470 }, { "contrastive_loss": 3.9573974609375, "epoch": 1.2412566686425608, "mse_loss": 0.08600505441427231, "step": 10470 }, { "epoch": 1.2424422050978068, "grad_norm": 0.3984375, "learning_rate": 0.00019643498755765525, "loss": 0.8656, "step": 10480 }, { "contrastive_loss": 4.0101318359375, "epoch": 1.2424422050978068, "mse_loss": 0.058360543102025986, "step": 10480 }, { "epoch": 1.2436277415530528, "grad_norm": 0.5078125, "learning_rate": 0.00019642404035405582, "loss": 0.8633, "step": 10490 }, { "contrastive_loss": 3.96240234375, "epoch": 1.2436277415530528, "mse_loss": 0.05461365729570389, "step": 10490 }, { "epoch": 1.2448132780082988, "grad_norm": 0.71484375, "learning_rate": 0.00019641307667422507, "loss": 0.859, "step": 10500 }, { "contrastive_loss": 3.9796142578125, "epoch": 1.2448132780082988, "mse_loss": 0.05810568109154701, "step": 10500 }, { "epoch": 1.2459988144635448, "grad_norm": 0.42578125, "learning_rate": 0.00019640209652003644, "loss": 0.8605, "step": 10510 }, { "contrastive_loss": 3.85693359375, "epoch": 1.2459988144635448, "mse_loss": 0.07582148164510727, "step": 10510 }, { "epoch": 1.2471843509187908, "grad_norm": 0.5234375, "learning_rate": 0.0001963910998933661, "loss": 0.8521, "step": 10520 }, { "contrastive_loss": 4.0716552734375, "epoch": 1.2471843509187908, "mse_loss": 0.054254282265901566, "step": 10520 }, { "epoch": 1.2483698873740368, "grad_norm": 0.4140625, "learning_rate": 0.00019638008679609309, "loss": 0.8584, "step": 10530 }, { "contrastive_loss": 4.0374755859375, "epoch": 1.2483698873740368, "mse_loss": 0.0896749347448349, "step": 10530 }, { "epoch": 1.2495554238292828, "grad_norm": 0.42578125, "learning_rate": 0.00019636905723009922, "loss": 0.8684, "step": 10540 }, { "contrastive_loss": 3.8572998046875, "epoch": 1.2495554238292828, "mse_loss": 0.08440651744604111, "step": 10540 }, { "epoch": 1.2507409602845287, "grad_norm": 0.416015625, "learning_rate": 0.0001963580111972692, "loss": 0.8582, "step": 10550 }, { "contrastive_loss": 3.9144287109375, "epoch": 1.2507409602845287, "mse_loss": 0.10915134102106094, "step": 10550 }, { "epoch": 1.2519264967397747, "grad_norm": 0.703125, "learning_rate": 0.00019634694869949046, "loss": 0.863, "step": 10560 }, { "contrastive_loss": 3.912841796875, "epoch": 1.2519264967397747, "mse_loss": 0.06066127493977547, "step": 10560 }, { "epoch": 1.2531120331950207, "grad_norm": 0.486328125, "learning_rate": 0.00019633586973865329, "loss": 0.8539, "step": 10570 }, { "contrastive_loss": 4.0548095703125, "epoch": 1.2531120331950207, "mse_loss": 0.05207375809550285, "step": 10570 }, { "epoch": 1.2542975696502667, "grad_norm": 0.48046875, "learning_rate": 0.00019632477431665075, "loss": 0.8523, "step": 10580 }, { "contrastive_loss": 3.992431640625, "epoch": 1.2542975696502667, "mse_loss": 0.06098190322518349, "step": 10580 }, { "epoch": 1.2554831061055127, "grad_norm": 0.609375, "learning_rate": 0.00019631366243537878, "loss": 0.8661, "step": 10590 }, { "contrastive_loss": 3.9132080078125, "epoch": 1.2554831061055127, "mse_loss": 0.06435463577508926, "step": 10590 }, { "epoch": 1.2566686425607587, "grad_norm": 0.49609375, "learning_rate": 0.00019630253409673608, "loss": 0.8612, "step": 10600 }, { "contrastive_loss": 3.89453125, "epoch": 1.2566686425607587, "mse_loss": 0.061603154987096786, "step": 10600 }, { "epoch": 1.2578541790160047, "grad_norm": 0.49609375, "learning_rate": 0.0001962913893026242, "loss": 0.853, "step": 10610 }, { "contrastive_loss": 3.947021484375, "epoch": 1.2578541790160047, "mse_loss": 0.05266295745968819, "step": 10610 }, { "epoch": 1.2590397154712507, "grad_norm": 0.3828125, "learning_rate": 0.00019628022805494747, "loss": 0.8672, "step": 10620 }, { "contrastive_loss": 3.9437255859375, "epoch": 1.2590397154712507, "mse_loss": 0.1076400950551033, "step": 10620 }, { "epoch": 1.2602252519264967, "grad_norm": 0.458984375, "learning_rate": 0.00019626905035561302, "loss": 0.8663, "step": 10630 }, { "contrastive_loss": 3.7744140625, "epoch": 1.2602252519264967, "mse_loss": 0.06405695527791977, "step": 10630 }, { "epoch": 1.2614107883817427, "grad_norm": 0.51953125, "learning_rate": 0.0001962578562065308, "loss": 0.861, "step": 10640 }, { "contrastive_loss": 4.0391845703125, "epoch": 1.2614107883817427, "mse_loss": 0.05420259013772011, "step": 10640 }, { "epoch": 1.2625963248369887, "grad_norm": 0.455078125, "learning_rate": 0.00019624664560961367, "loss": 0.8646, "step": 10650 }, { "contrastive_loss": 3.949951171875, "epoch": 1.2625963248369887, "mse_loss": 0.08704038709402084, "step": 10650 }, { "epoch": 1.2637818612922347, "grad_norm": 0.35546875, "learning_rate": 0.00019623541856677708, "loss": 0.8585, "step": 10660 }, { "contrastive_loss": 3.8956298828125, "epoch": 1.2637818612922347, "mse_loss": 0.08698832243680954, "step": 10660 }, { "epoch": 1.2649673977474807, "grad_norm": 0.51171875, "learning_rate": 0.00019622417507993958, "loss": 0.852, "step": 10670 }, { "contrastive_loss": 3.9566650390625, "epoch": 1.2649673977474807, "mse_loss": 0.07618880271911621, "step": 10670 }, { "epoch": 1.2661529342027267, "grad_norm": 0.39453125, "learning_rate": 0.00019621291515102226, "loss": 0.8657, "step": 10680 }, { "contrastive_loss": 3.9581298828125, "epoch": 1.2661529342027267, "mse_loss": 0.0629720464348793, "step": 10680 }, { "epoch": 1.2673384706579727, "grad_norm": 0.5, "learning_rate": 0.00019620163878194917, "loss": 0.859, "step": 10690 }, { "contrastive_loss": 3.862548828125, "epoch": 1.2673384706579727, "mse_loss": 0.06136145815253258, "step": 10690 }, { "epoch": 1.2685240071132187, "grad_norm": 0.53515625, "learning_rate": 0.00019619034597464713, "loss": 0.8537, "step": 10700 }, { "contrastive_loss": 3.91455078125, "epoch": 1.2685240071132187, "mse_loss": 0.058251552283763885, "step": 10700 }, { "epoch": 1.2697095435684647, "grad_norm": 0.5, "learning_rate": 0.0001961790367310458, "loss": 0.8527, "step": 10710 }, { "contrastive_loss": 3.940673828125, "epoch": 1.2697095435684647, "mse_loss": 0.061115868389606476, "step": 10710 }, { "epoch": 1.2708950800237107, "grad_norm": 0.423828125, "learning_rate": 0.00019616771105307755, "loss": 0.8438, "step": 10720 }, { "contrastive_loss": 3.95556640625, "epoch": 1.2708950800237107, "mse_loss": 0.048750076442956924, "step": 10720 }, { "epoch": 1.2720806164789566, "grad_norm": 0.404296875, "learning_rate": 0.00019615636894267772, "loss": 0.8488, "step": 10730 }, { "contrastive_loss": 3.87109375, "epoch": 1.2720806164789566, "mse_loss": 0.08353202790021896, "step": 10730 }, { "epoch": 1.2732661529342026, "grad_norm": 0.474609375, "learning_rate": 0.0001961450104017843, "loss": 0.8586, "step": 10740 }, { "contrastive_loss": 3.9205322265625, "epoch": 1.2732661529342026, "mse_loss": 0.08203167468309402, "step": 10740 }, { "epoch": 1.2744516893894486, "grad_norm": 0.6328125, "learning_rate": 0.00019613363543233815, "loss": 0.8631, "step": 10750 }, { "contrastive_loss": 3.8433837890625, "epoch": 1.2744516893894486, "mse_loss": 0.060573678463697433, "step": 10750 }, { "epoch": 1.2756372258446946, "grad_norm": 0.53125, "learning_rate": 0.000196122244036283, "loss": 0.8536, "step": 10760 }, { "contrastive_loss": 4.0030517578125, "epoch": 1.2756372258446946, "mse_loss": 0.05790631100535393, "step": 10760 }, { "epoch": 1.2768227622999406, "grad_norm": 0.51171875, "learning_rate": 0.0001961108362155653, "loss": 0.8647, "step": 10770 }, { "contrastive_loss": 3.884521484375, "epoch": 1.2768227622999406, "mse_loss": 0.09682460874319077, "step": 10770 }, { "epoch": 1.2780082987551866, "grad_norm": 0.60546875, "learning_rate": 0.0001960994119721343, "loss": 0.864, "step": 10780 }, { "contrastive_loss": 3.834716796875, "epoch": 1.2780082987551866, "mse_loss": 0.10280445963144302, "step": 10780 }, { "epoch": 1.2791938352104326, "grad_norm": 0.48046875, "learning_rate": 0.00019608797130794213, "loss": 0.8588, "step": 10790 }, { "contrastive_loss": 3.9771728515625, "epoch": 1.2791938352104326, "mse_loss": 0.06963939219713211, "step": 10790 }, { "epoch": 1.2803793716656786, "grad_norm": 0.53125, "learning_rate": 0.00019607651422494366, "loss": 0.8582, "step": 10800 }, { "contrastive_loss": 3.9591064453125, "epoch": 1.2803793716656786, "mse_loss": 0.053943734616041183, "step": 10800 }, { "epoch": 1.2815649081209246, "grad_norm": 0.60546875, "learning_rate": 0.00019606504072509662, "loss": 0.864, "step": 10810 }, { "contrastive_loss": 3.93408203125, "epoch": 1.2815649081209246, "mse_loss": 0.059684883803129196, "step": 10810 }, { "epoch": 1.2827504445761706, "grad_norm": 0.484375, "learning_rate": 0.00019605355081036153, "loss": 0.8716, "step": 10820 }, { "contrastive_loss": 3.9556884765625, "epoch": 1.2827504445761706, "mse_loss": 0.06089723855257034, "step": 10820 }, { "epoch": 1.2839359810314166, "grad_norm": 0.40234375, "learning_rate": 0.00019604204448270162, "loss": 0.8587, "step": 10830 }, { "contrastive_loss": 3.95068359375, "epoch": 1.2839359810314166, "mse_loss": 0.08247977495193481, "step": 10830 }, { "epoch": 1.2851215174866626, "grad_norm": 0.498046875, "learning_rate": 0.0001960305217440831, "loss": 0.862, "step": 10840 }, { "contrastive_loss": 3.9176025390625, "epoch": 1.2851215174866626, "mse_loss": 0.08514125645160675, "step": 10840 }, { "epoch": 1.2863070539419086, "grad_norm": 0.640625, "learning_rate": 0.00019601898259647487, "loss": 0.8542, "step": 10850 }, { "contrastive_loss": 3.8099365234375, "epoch": 1.2863070539419086, "mse_loss": 0.06362811475992203, "step": 10850 }, { "epoch": 1.2874925903971546, "grad_norm": 0.5546875, "learning_rate": 0.0001960074270418486, "loss": 0.8583, "step": 10860 }, { "contrastive_loss": 3.87890625, "epoch": 1.2874925903971546, "mse_loss": 0.05077942833304405, "step": 10860 }, { "epoch": 1.2886781268524006, "grad_norm": 0.45703125, "learning_rate": 0.00019599585508217891, "loss": 0.8443, "step": 10870 }, { "contrastive_loss": 3.9552001953125, "epoch": 1.2886781268524006, "mse_loss": 0.06741485744714737, "step": 10870 }, { "epoch": 1.2898636633076468, "grad_norm": 0.45703125, "learning_rate": 0.00019598426671944304, "loss": 0.8622, "step": 10880 }, { "contrastive_loss": 3.9171142578125, "epoch": 1.2898636633076468, "mse_loss": 0.0649196058511734, "step": 10880 }, { "epoch": 1.2910491997628928, "grad_norm": 0.419921875, "learning_rate": 0.00019597266195562116, "loss": 0.8526, "step": 10890 }, { "contrastive_loss": 3.7808837890625, "epoch": 1.2910491997628928, "mse_loss": 0.06375245749950409, "step": 10890 }, { "epoch": 1.2922347362181388, "grad_norm": 0.6171875, "learning_rate": 0.0001959610407926962, "loss": 0.8581, "step": 10900 }, { "contrastive_loss": 3.9925537109375, "epoch": 1.2922347362181388, "mse_loss": 0.07829879224300385, "step": 10900 }, { "epoch": 1.2934202726733848, "grad_norm": 0.439453125, "learning_rate": 0.00019594940323265395, "loss": 0.8624, "step": 10910 }, { "contrastive_loss": 3.894287109375, "epoch": 1.2934202726733848, "mse_loss": 0.06777294725179672, "step": 10910 }, { "epoch": 1.2946058091286308, "grad_norm": 0.41015625, "learning_rate": 0.0001959377492774829, "loss": 0.8564, "step": 10920 }, { "contrastive_loss": 4.00341796875, "epoch": 1.2946058091286308, "mse_loss": 0.06710954010486603, "step": 10920 }, { "epoch": 1.2957913455838768, "grad_norm": 0.66015625, "learning_rate": 0.00019592607892917436, "loss": 0.8645, "step": 10930 }, { "contrastive_loss": 3.8160400390625, "epoch": 1.2957913455838768, "mse_loss": 0.08821123093366623, "step": 10930 }, { "epoch": 1.2969768820391228, "grad_norm": 0.50390625, "learning_rate": 0.00019591439218972253, "loss": 0.8664, "step": 10940 }, { "contrastive_loss": 3.9561767578125, "epoch": 1.2969768820391228, "mse_loss": 0.08641320466995239, "step": 10940 }, { "epoch": 1.2981624184943688, "grad_norm": 0.49609375, "learning_rate": 0.00019590268906112437, "loss": 0.8618, "step": 10950 }, { "contrastive_loss": 3.763671875, "epoch": 1.2981624184943688, "mse_loss": 0.061915989965200424, "step": 10950 }, { "epoch": 1.2993479549496147, "grad_norm": 0.46875, "learning_rate": 0.00019589096954537958, "loss": 0.8509, "step": 10960 }, { "contrastive_loss": 4.014404296875, "epoch": 1.2993479549496147, "mse_loss": 0.06866598129272461, "step": 10960 }, { "epoch": 1.3005334914048607, "grad_norm": 0.4609375, "learning_rate": 0.00019587923364449073, "loss": 0.8515, "step": 10970 }, { "contrastive_loss": 4.1143798828125, "epoch": 1.3005334914048607, "mse_loss": 0.08019731193780899, "step": 10970 }, { "epoch": 1.3017190278601067, "grad_norm": 0.5234375, "learning_rate": 0.0001958674813604631, "loss": 0.8577, "step": 10980 }, { "contrastive_loss": 3.8753662109375, "epoch": 1.3017190278601067, "mse_loss": 0.050462186336517334, "step": 10980 }, { "epoch": 1.3029045643153527, "grad_norm": 0.453125, "learning_rate": 0.00019585571269530494, "loss": 0.859, "step": 10990 }, { "contrastive_loss": 4.01611328125, "epoch": 1.3029045643153527, "mse_loss": 0.05853644013404846, "step": 10990 }, { "epoch": 1.3040901007705987, "grad_norm": 0.45703125, "learning_rate": 0.00019584392765102714, "loss": 0.8702, "step": 11000 }, { "contrastive_loss": 3.8836669921875, "epoch": 1.3040901007705987, "mse_loss": 0.05655742436647415, "step": 11000 }, { "epoch": 1.3052756372258447, "grad_norm": 0.33984375, "learning_rate": 0.00019583212622964341, "loss": 0.8503, "step": 11010 }, { "contrastive_loss": 4.0521240234375, "epoch": 1.3052756372258447, "mse_loss": 0.09252266585826874, "step": 11010 }, { "epoch": 1.3064611736810907, "grad_norm": 0.55859375, "learning_rate": 0.00019582030843317037, "loss": 0.8645, "step": 11020 }, { "contrastive_loss": 3.8623046875, "epoch": 1.3064611736810907, "mse_loss": 0.11039694398641586, "step": 11020 }, { "epoch": 1.3076467101363367, "grad_norm": 0.53515625, "learning_rate": 0.00019580847426362724, "loss": 0.8668, "step": 11030 }, { "contrastive_loss": 3.895751953125, "epoch": 1.3076467101363367, "mse_loss": 0.056344423443078995, "step": 11030 }, { "epoch": 1.3088322465915827, "grad_norm": 0.447265625, "learning_rate": 0.00019579662372303628, "loss": 0.8489, "step": 11040 }, { "contrastive_loss": 3.949951171875, "epoch": 1.3088322465915827, "mse_loss": 0.07848302274942398, "step": 11040 }, { "epoch": 1.3100177830468287, "grad_norm": 0.474609375, "learning_rate": 0.00019578475681342235, "loss": 0.8557, "step": 11050 }, { "contrastive_loss": 4.0263671875, "epoch": 1.3100177830468287, "mse_loss": 0.05004411190748215, "step": 11050 }, { "epoch": 1.3112033195020747, "grad_norm": 0.57421875, "learning_rate": 0.0001957728735368132, "loss": 0.854, "step": 11060 }, { "contrastive_loss": 3.9468994140625, "epoch": 1.3112033195020747, "mse_loss": 0.11291459947824478, "step": 11060 }, { "epoch": 1.3123888559573207, "grad_norm": 0.46875, "learning_rate": 0.00019576097389523937, "loss": 0.8771, "step": 11070 }, { "contrastive_loss": 3.9710693359375, "epoch": 1.3123888559573207, "mse_loss": 0.07529043406248093, "step": 11070 }, { "epoch": 1.3135743924125667, "grad_norm": 0.46875, "learning_rate": 0.00019574905789073417, "loss": 0.8713, "step": 11080 }, { "contrastive_loss": 3.99462890625, "epoch": 1.3135743924125667, "mse_loss": 0.06493956595659256, "step": 11080 }, { "epoch": 1.3147599288678127, "grad_norm": 0.474609375, "learning_rate": 0.0001957371255253337, "loss": 0.8595, "step": 11090 }, { "contrastive_loss": 3.992919921875, "epoch": 1.3147599288678127, "mse_loss": 0.09635041654109955, "step": 11090 }, { "epoch": 1.3159454653230587, "grad_norm": 0.439453125, "learning_rate": 0.0001957251768010769, "loss": 0.8639, "step": 11100 }, { "contrastive_loss": 3.831298828125, "epoch": 1.3159454653230587, "mse_loss": 0.09976120293140411, "step": 11100 }, { "epoch": 1.3171310017783047, "grad_norm": 0.578125, "learning_rate": 0.00019571321172000546, "loss": 0.8684, "step": 11110 }, { "contrastive_loss": 3.906982421875, "epoch": 1.3171310017783047, "mse_loss": 0.06314428895711899, "step": 11110 }, { "epoch": 1.3183165382335507, "grad_norm": 0.451171875, "learning_rate": 0.00019570123028416392, "loss": 0.8505, "step": 11120 }, { "contrastive_loss": 3.9530029296875, "epoch": 1.3183165382335507, "mse_loss": 0.06789743900299072, "step": 11120 }, { "epoch": 1.3195020746887967, "grad_norm": 0.49609375, "learning_rate": 0.00019568923249559954, "loss": 0.8595, "step": 11130 }, { "contrastive_loss": 3.967529296875, "epoch": 1.3195020746887967, "mse_loss": 0.04812708869576454, "step": 11130 }, { "epoch": 1.3206876111440427, "grad_norm": 0.498046875, "learning_rate": 0.00019567721835636245, "loss": 0.8761, "step": 11140 }, { "contrastive_loss": 3.913330078125, "epoch": 1.3206876111440427, "mse_loss": 0.07406393438577652, "step": 11140 }, { "epoch": 1.3218731475992886, "grad_norm": 0.55078125, "learning_rate": 0.00019566518786850553, "loss": 0.8791, "step": 11150 }, { "contrastive_loss": 3.933349609375, "epoch": 1.3218731475992886, "mse_loss": 0.054720014333724976, "step": 11150 }, { "epoch": 1.3230586840545346, "grad_norm": 0.416015625, "learning_rate": 0.00019565314103408443, "loss": 0.8638, "step": 11160 }, { "contrastive_loss": 3.983154296875, "epoch": 1.3230586840545346, "mse_loss": 0.0704660639166832, "step": 11160 }, { "epoch": 1.3242442205097806, "grad_norm": 0.55859375, "learning_rate": 0.00019564107785515766, "loss": 0.8536, "step": 11170 }, { "contrastive_loss": 3.810546875, "epoch": 1.3242442205097806, "mse_loss": 0.08964085578918457, "step": 11170 }, { "epoch": 1.3254297569650266, "grad_norm": 0.51171875, "learning_rate": 0.00019562899833378648, "loss": 0.8568, "step": 11180 }, { "contrastive_loss": 4.0479736328125, "epoch": 1.3254297569650266, "mse_loss": 0.07091303169727325, "step": 11180 }, { "epoch": 1.3266152934202726, "grad_norm": 0.609375, "learning_rate": 0.00019561690247203492, "loss": 0.872, "step": 11190 }, { "contrastive_loss": 3.8818359375, "epoch": 1.3266152934202726, "mse_loss": 0.06545174866914749, "step": 11190 }, { "epoch": 1.3278008298755186, "grad_norm": 0.5078125, "learning_rate": 0.00019560479027196985, "loss": 0.8632, "step": 11200 }, { "contrastive_loss": 3.967529296875, "epoch": 1.3278008298755186, "mse_loss": 0.06514988094568253, "step": 11200 }, { "epoch": 1.3289863663307646, "grad_norm": 0.3984375, "learning_rate": 0.00019559266173566094, "loss": 0.8569, "step": 11210 }, { "contrastive_loss": 3.979736328125, "epoch": 1.3289863663307646, "mse_loss": 0.06035405769944191, "step": 11210 }, { "epoch": 1.3301719027860106, "grad_norm": 0.55078125, "learning_rate": 0.00019558051686518061, "loss": 0.8618, "step": 11220 }, { "contrastive_loss": 3.9080810546875, "epoch": 1.3301719027860106, "mse_loss": 0.07989169657230377, "step": 11220 }, { "epoch": 1.3313574392412566, "grad_norm": 0.392578125, "learning_rate": 0.00019556835566260407, "loss": 0.8642, "step": 11230 }, { "contrastive_loss": 3.88671875, "epoch": 1.3313574392412566, "mse_loss": 0.06797122210264206, "step": 11230 }, { "epoch": 1.3325429756965026, "grad_norm": 0.3515625, "learning_rate": 0.00019555617813000936, "loss": 0.8502, "step": 11240 }, { "contrastive_loss": 4.015869140625, "epoch": 1.3325429756965026, "mse_loss": 0.07078112661838531, "step": 11240 }, { "epoch": 1.3337285121517486, "grad_norm": 0.46875, "learning_rate": 0.00019554398426947724, "loss": 0.8672, "step": 11250 }, { "contrastive_loss": 3.9488525390625, "epoch": 1.3337285121517486, "mse_loss": 0.07023141533136368, "step": 11250 }, { "epoch": 1.3349140486069946, "grad_norm": 0.4609375, "learning_rate": 0.0001955317740830914, "loss": 0.8668, "step": 11260 }, { "contrastive_loss": 3.8740234375, "epoch": 1.3349140486069946, "mse_loss": 0.059867922216653824, "step": 11260 }, { "epoch": 1.3360995850622408, "grad_norm": 0.41015625, "learning_rate": 0.00019551954757293812, "loss": 0.8508, "step": 11270 }, { "contrastive_loss": 3.8902587890625, "epoch": 1.3360995850622408, "mse_loss": 0.08276408165693283, "step": 11270 }, { "epoch": 1.3372851215174868, "grad_norm": 0.51171875, "learning_rate": 0.00019550730474110663, "loss": 0.8536, "step": 11280 }, { "contrastive_loss": 3.98779296875, "epoch": 1.3372851215174868, "mse_loss": 0.07494653016328812, "step": 11280 }, { "epoch": 1.3384706579727328, "grad_norm": 0.55078125, "learning_rate": 0.0001954950455896889, "loss": 0.8736, "step": 11290 }, { "contrastive_loss": 3.951904296875, "epoch": 1.3384706579727328, "mse_loss": 0.0728529691696167, "step": 11290 }, { "epoch": 1.3396561944279788, "grad_norm": 0.478515625, "learning_rate": 0.00019548277012077967, "loss": 0.8628, "step": 11300 }, { "contrastive_loss": 4.0570068359375, "epoch": 1.3396561944279788, "mse_loss": 0.05531611293554306, "step": 11300 }, { "epoch": 1.3408417308832248, "grad_norm": 0.431640625, "learning_rate": 0.00019547047833647652, "loss": 0.8519, "step": 11310 }, { "contrastive_loss": 3.968017578125, "epoch": 1.3408417308832248, "mse_loss": 0.07162908464670181, "step": 11310 }, { "epoch": 1.3420272673384708, "grad_norm": 0.404296875, "learning_rate": 0.0001954581702388797, "loss": 0.8564, "step": 11320 }, { "contrastive_loss": 3.9244384765625, "epoch": 1.3420272673384708, "mse_loss": 0.0651649683713913, "step": 11320 }, { "epoch": 1.3432128037937168, "grad_norm": 0.447265625, "learning_rate": 0.0001954458458300924, "loss": 0.8517, "step": 11330 }, { "contrastive_loss": 3.828369140625, "epoch": 1.3432128037937168, "mse_loss": 0.07458160072565079, "step": 11330 }, { "epoch": 1.3443983402489628, "grad_norm": 0.51171875, "learning_rate": 0.00019543350511222048, "loss": 0.8641, "step": 11340 }, { "contrastive_loss": 4.0107421875, "epoch": 1.3443983402489628, "mse_loss": 0.07709860056638718, "step": 11340 }, { "epoch": 1.3455838767042088, "grad_norm": 0.447265625, "learning_rate": 0.00019542114808737264, "loss": 0.8536, "step": 11350 }, { "contrastive_loss": 4.0234375, "epoch": 1.3455838767042088, "mse_loss": 0.06299971789121628, "step": 11350 }, { "epoch": 1.3467694131594548, "grad_norm": 0.41796875, "learning_rate": 0.00019540877475766037, "loss": 0.8427, "step": 11360 }, { "contrastive_loss": 3.934814453125, "epoch": 1.3467694131594548, "mse_loss": 0.04730408638715744, "step": 11360 }, { "epoch": 1.3479549496147007, "grad_norm": 0.416015625, "learning_rate": 0.00019539638512519795, "loss": 0.8607, "step": 11370 }, { "contrastive_loss": 3.8919677734375, "epoch": 1.3479549496147007, "mse_loss": 0.06489202380180359, "step": 11370 }, { "epoch": 1.3491404860699467, "grad_norm": 0.609375, "learning_rate": 0.00019538397919210238, "loss": 0.856, "step": 11380 }, { "contrastive_loss": 3.9229736328125, "epoch": 1.3491404860699467, "mse_loss": 0.06860911846160889, "step": 11380 }, { "epoch": 1.3503260225251927, "grad_norm": 0.435546875, "learning_rate": 0.00019537155696049355, "loss": 0.8499, "step": 11390 }, { "contrastive_loss": 3.8900146484375, "epoch": 1.3503260225251927, "mse_loss": 0.07629521936178207, "step": 11390 }, { "epoch": 1.3515115589804387, "grad_norm": 0.4765625, "learning_rate": 0.00019535911843249405, "loss": 0.8575, "step": 11400 }, { "contrastive_loss": 3.8428955078125, "epoch": 1.3515115589804387, "mse_loss": 0.06030631437897682, "step": 11400 }, { "epoch": 1.3526970954356847, "grad_norm": 0.41796875, "learning_rate": 0.0001953466636102293, "loss": 0.8558, "step": 11410 }, { "contrastive_loss": 3.8853759765625, "epoch": 1.3526970954356847, "mse_loss": 0.06871069222688675, "step": 11410 }, { "epoch": 1.3538826318909307, "grad_norm": 0.5546875, "learning_rate": 0.00019533419249582746, "loss": 0.8528, "step": 11420 }, { "contrastive_loss": 3.9891357421875, "epoch": 1.3538826318909307, "mse_loss": 0.06240134313702583, "step": 11420 }, { "epoch": 1.3550681683461767, "grad_norm": 0.66796875, "learning_rate": 0.0001953217050914195, "loss": 0.8698, "step": 11430 }, { "contrastive_loss": 4.0118408203125, "epoch": 1.3550681683461767, "mse_loss": 0.06289966404438019, "step": 11430 }, { "epoch": 1.3562537048014227, "grad_norm": 0.466796875, "learning_rate": 0.0001953092013991392, "loss": 0.8693, "step": 11440 }, { "contrastive_loss": 3.8572998046875, "epoch": 1.3562537048014227, "mse_loss": 0.03788324445486069, "step": 11440 }, { "epoch": 1.3574392412566687, "grad_norm": 0.380859375, "learning_rate": 0.0001952966814211231, "loss": 0.8584, "step": 11450 }, { "contrastive_loss": 4.027099609375, "epoch": 1.3574392412566687, "mse_loss": 0.10394131392240524, "step": 11450 }, { "epoch": 1.3586247777119147, "grad_norm": 0.373046875, "learning_rate": 0.00019528414515951052, "loss": 0.863, "step": 11460 }, { "contrastive_loss": 4.0458984375, "epoch": 1.3586247777119147, "mse_loss": 0.0812213197350502, "step": 11460 }, { "epoch": 1.3598103141671607, "grad_norm": 0.37109375, "learning_rate": 0.00019527159261644358, "loss": 0.8689, "step": 11470 }, { "contrastive_loss": 3.8636474609375, "epoch": 1.3598103141671607, "mse_loss": 0.08645908534526825, "step": 11470 }, { "epoch": 1.3609958506224067, "grad_norm": 0.6484375, "learning_rate": 0.00019525902379406712, "loss": 0.8623, "step": 11480 }, { "contrastive_loss": 3.95458984375, "epoch": 1.3609958506224067, "mse_loss": 0.07865112274885178, "step": 11480 }, { "epoch": 1.3621813870776527, "grad_norm": 0.64453125, "learning_rate": 0.00019524643869452883, "loss": 0.8624, "step": 11490 }, { "contrastive_loss": 3.9520263671875, "epoch": 1.3621813870776527, "mse_loss": 0.06504561007022858, "step": 11490 }, { "epoch": 1.3633669235328987, "grad_norm": 0.4296875, "learning_rate": 0.00019523383731997917, "loss": 0.86, "step": 11500 }, { "contrastive_loss": 3.9525146484375, "epoch": 1.3633669235328987, "mse_loss": 0.07477208226919174, "step": 11500 }, { "epoch": 1.3645524599881447, "grad_norm": 0.49609375, "learning_rate": 0.0001952212196725714, "loss": 0.8689, "step": 11510 }, { "contrastive_loss": 3.828857421875, "epoch": 1.3645524599881447, "mse_loss": 0.07703007757663727, "step": 11510 }, { "epoch": 1.3657379964433907, "grad_norm": 0.53125, "learning_rate": 0.00019520858575446145, "loss": 0.8583, "step": 11520 }, { "contrastive_loss": 3.9400634765625, "epoch": 1.3657379964433907, "mse_loss": 0.0743480697274208, "step": 11520 }, { "epoch": 1.3669235328986367, "grad_norm": 0.498046875, "learning_rate": 0.00019519593556780812, "loss": 0.8656, "step": 11530 }, { "contrastive_loss": 3.8751220703125, "epoch": 1.3669235328986367, "mse_loss": 0.04796851426362991, "step": 11530 }, { "epoch": 1.3681090693538827, "grad_norm": 0.515625, "learning_rate": 0.00019518326911477306, "loss": 0.8535, "step": 11540 }, { "contrastive_loss": 3.9210205078125, "epoch": 1.3681090693538827, "mse_loss": 0.06058189645409584, "step": 11540 }, { "epoch": 1.3692946058091287, "grad_norm": 0.6640625, "learning_rate": 0.0001951705863975206, "loss": 0.8592, "step": 11550 }, { "contrastive_loss": 3.9171142578125, "epoch": 1.3692946058091287, "mse_loss": 0.060221750289201736, "step": 11550 }, { "epoch": 1.3704801422643746, "grad_norm": 0.494140625, "learning_rate": 0.00019515788741821782, "loss": 0.854, "step": 11560 }, { "contrastive_loss": 3.9765625, "epoch": 1.3704801422643746, "mse_loss": 0.06260965764522552, "step": 11560 }, { "epoch": 1.3716656787196206, "grad_norm": 0.5234375, "learning_rate": 0.00019514517217903465, "loss": 0.8548, "step": 11570 }, { "contrastive_loss": 3.951171875, "epoch": 1.3716656787196206, "mse_loss": 0.0685577467083931, "step": 11570 }, { "epoch": 1.3728512151748666, "grad_norm": 0.384765625, "learning_rate": 0.0001951324406821438, "loss": 0.8612, "step": 11580 }, { "contrastive_loss": 3.8375244140625, "epoch": 1.3728512151748666, "mse_loss": 0.07468608766794205, "step": 11580 }, { "epoch": 1.3740367516301126, "grad_norm": 0.5, "learning_rate": 0.00019511969292972068, "loss": 0.8551, "step": 11590 }, { "contrastive_loss": 3.7777099609375, "epoch": 1.3740367516301126, "mse_loss": 0.04901688173413277, "step": 11590 }, { "epoch": 1.3752222880853586, "grad_norm": 0.515625, "learning_rate": 0.0001951069289239436, "loss": 0.8596, "step": 11600 }, { "contrastive_loss": 4.0113525390625, "epoch": 1.3752222880853586, "mse_loss": 0.06789617240428925, "step": 11600 }, { "epoch": 1.3764078245406046, "grad_norm": 0.50390625, "learning_rate": 0.00019509414866699352, "loss": 0.854, "step": 11610 }, { "contrastive_loss": 3.916015625, "epoch": 1.3764078245406046, "mse_loss": 0.07959004491567612, "step": 11610 }, { "epoch": 1.3775933609958506, "grad_norm": 0.5859375, "learning_rate": 0.0001950813521610543, "loss": 0.862, "step": 11620 }, { "contrastive_loss": 3.8685302734375, "epoch": 1.3775933609958506, "mse_loss": 0.07947365194559097, "step": 11620 }, { "epoch": 1.3787788974510966, "grad_norm": 0.41015625, "learning_rate": 0.00019506853940831243, "loss": 0.8528, "step": 11630 }, { "contrastive_loss": 3.84423828125, "epoch": 1.3787788974510966, "mse_loss": 0.07521678507328033, "step": 11630 }, { "epoch": 1.3799644339063426, "grad_norm": 0.451171875, "learning_rate": 0.00019505571041095735, "loss": 0.8577, "step": 11640 }, { "contrastive_loss": 3.947021484375, "epoch": 1.3799644339063426, "mse_loss": 0.06042451411485672, "step": 11640 }, { "epoch": 1.3811499703615886, "grad_norm": 0.5390625, "learning_rate": 0.00019504286517118112, "loss": 0.8615, "step": 11650 }, { "contrastive_loss": 4.0869140625, "epoch": 1.3811499703615886, "mse_loss": 0.07258334010839462, "step": 11650 }, { "epoch": 1.3823355068168346, "grad_norm": 0.42578125, "learning_rate": 0.00019503000369117866, "loss": 0.8491, "step": 11660 }, { "contrastive_loss": 3.8782958984375, "epoch": 1.3823355068168346, "mse_loss": 0.06585852801799774, "step": 11660 }, { "epoch": 1.3835210432720806, "grad_norm": 0.392578125, "learning_rate": 0.00019501712597314765, "loss": 0.8456, "step": 11670 }, { "contrastive_loss": 3.86962890625, "epoch": 1.3835210432720806, "mse_loss": 0.07132317870855331, "step": 11670 }, { "epoch": 1.3847065797273266, "grad_norm": 0.484375, "learning_rate": 0.00019500423201928855, "loss": 0.8495, "step": 11680 }, { "contrastive_loss": 3.896240234375, "epoch": 1.3847065797273266, "mse_loss": 0.055467069149017334, "step": 11680 }, { "epoch": 1.3858921161825726, "grad_norm": 0.43359375, "learning_rate": 0.00019499132183180452, "loss": 0.8555, "step": 11690 }, { "contrastive_loss": 3.894775390625, "epoch": 1.3858921161825726, "mse_loss": 0.06590113043785095, "step": 11690 }, { "epoch": 1.3870776526378186, "grad_norm": 0.4765625, "learning_rate": 0.00019497839541290167, "loss": 0.8531, "step": 11700 }, { "contrastive_loss": 3.9586181640625, "epoch": 1.3870776526378186, "mse_loss": 0.09253861010074615, "step": 11700 }, { "epoch": 1.3882631890930646, "grad_norm": 0.392578125, "learning_rate": 0.00019496545276478865, "loss": 0.8614, "step": 11710 }, { "contrastive_loss": 3.8798828125, "epoch": 1.3882631890930646, "mse_loss": 0.08795236051082611, "step": 11710 }, { "epoch": 1.3894487255483106, "grad_norm": 0.4375, "learning_rate": 0.0001949524938896771, "loss": 0.8537, "step": 11720 }, { "contrastive_loss": 3.9874267578125, "epoch": 1.3894487255483106, "mse_loss": 0.07489226758480072, "step": 11720 }, { "epoch": 1.3906342620035566, "grad_norm": 0.5078125, "learning_rate": 0.0001949395187897813, "loss": 0.8635, "step": 11730 }, { "contrastive_loss": 3.985595703125, "epoch": 1.3906342620035566, "mse_loss": 0.05532357841730118, "step": 11730 }, { "epoch": 1.3918197984588025, "grad_norm": 0.466796875, "learning_rate": 0.00019492652746731836, "loss": 0.8482, "step": 11740 }, { "contrastive_loss": 3.850830078125, "epoch": 1.3918197984588025, "mse_loss": 0.09159344434738159, "step": 11740 }, { "epoch": 1.3930053349140485, "grad_norm": 0.53125, "learning_rate": 0.00019491351992450805, "loss": 0.8514, "step": 11750 }, { "contrastive_loss": 3.8216552734375, "epoch": 1.3930053349140485, "mse_loss": 0.07109618932008743, "step": 11750 }, { "epoch": 1.3941908713692945, "grad_norm": 0.43359375, "learning_rate": 0.00019490049616357314, "loss": 0.8628, "step": 11760 }, { "contrastive_loss": 3.9384765625, "epoch": 1.3941908713692945, "mse_loss": 0.04828047752380371, "step": 11760 }, { "epoch": 1.3953764078245405, "grad_norm": 0.4765625, "learning_rate": 0.00019488745618673894, "loss": 0.8534, "step": 11770 }, { "contrastive_loss": 3.8887939453125, "epoch": 1.3953764078245405, "mse_loss": 0.07806825637817383, "step": 11770 }, { "epoch": 1.3965619442797865, "grad_norm": 0.484375, "learning_rate": 0.00019487439999623364, "loss": 0.8537, "step": 11780 }, { "contrastive_loss": 3.871337890625, "epoch": 1.3965619442797865, "mse_loss": 0.055810995399951935, "step": 11780 }, { "epoch": 1.3977474807350325, "grad_norm": 0.625, "learning_rate": 0.00019486132759428823, "loss": 0.845, "step": 11790 }, { "contrastive_loss": 3.8079833984375, "epoch": 1.3977474807350325, "mse_loss": 0.08297073096036911, "step": 11790 }, { "epoch": 1.3989330171902785, "grad_norm": 0.404296875, "learning_rate": 0.0001948482389831364, "loss": 0.8626, "step": 11800 }, { "contrastive_loss": 3.868896484375, "epoch": 1.3989330171902785, "mse_loss": 0.06597503274679184, "step": 11800 }, { "epoch": 1.4001185536455245, "grad_norm": 0.498046875, "learning_rate": 0.00019483513416501463, "loss": 0.8493, "step": 11810 }, { "contrastive_loss": 3.9849853515625, "epoch": 1.4001185536455245, "mse_loss": 0.05717841535806656, "step": 11810 }, { "epoch": 1.4013040901007705, "grad_norm": 0.484375, "learning_rate": 0.00019482201314216218, "loss": 0.8524, "step": 11820 }, { "contrastive_loss": 3.8687744140625, "epoch": 1.4013040901007705, "mse_loss": 0.09837799519300461, "step": 11820 }, { "epoch": 1.4024896265560165, "grad_norm": 0.484375, "learning_rate": 0.00019480887591682107, "loss": 0.8537, "step": 11830 }, { "contrastive_loss": 3.93359375, "epoch": 1.4024896265560165, "mse_loss": 0.06828854978084564, "step": 11830 }, { "epoch": 1.4036751630112625, "grad_norm": 0.54296875, "learning_rate": 0.0001947957224912361, "loss": 0.8469, "step": 11840 }, { "contrastive_loss": 3.8621826171875, "epoch": 1.4036751630112625, "mse_loss": 0.06154097989201546, "step": 11840 }, { "epoch": 1.4048606994665085, "grad_norm": 0.431640625, "learning_rate": 0.0001947825528676548, "loss": 0.8547, "step": 11850 }, { "contrastive_loss": 3.8035888671875, "epoch": 1.4048606994665085, "mse_loss": 0.04962761327624321, "step": 11850 }, { "epoch": 1.4060462359217545, "grad_norm": 0.498046875, "learning_rate": 0.00019476936704832754, "loss": 0.8504, "step": 11860 }, { "contrastive_loss": 3.9156494140625, "epoch": 1.4060462359217545, "mse_loss": 0.05507687106728554, "step": 11860 }, { "epoch": 1.4072317723770005, "grad_norm": 0.51171875, "learning_rate": 0.00019475616503550737, "loss": 0.8653, "step": 11870 }, { "contrastive_loss": 3.9083251953125, "epoch": 1.4072317723770005, "mse_loss": 0.05543080344796181, "step": 11870 }, { "epoch": 1.4084173088322465, "grad_norm": 0.462890625, "learning_rate": 0.00019474294683145024, "loss": 0.8437, "step": 11880 }, { "contrastive_loss": 4.0050048828125, "epoch": 1.4084173088322465, "mse_loss": 0.0693662241101265, "step": 11880 }, { "epoch": 1.4096028452874925, "grad_norm": 0.41796875, "learning_rate": 0.0001947297124384147, "loss": 0.8653, "step": 11890 }, { "contrastive_loss": 3.904541015625, "epoch": 1.4096028452874925, "mse_loss": 0.08211679011583328, "step": 11890 }, { "epoch": 1.4107883817427385, "grad_norm": 0.5, "learning_rate": 0.00019471646185866215, "loss": 0.8518, "step": 11900 }, { "contrastive_loss": 3.882080078125, "epoch": 1.4107883817427385, "mse_loss": 0.05587771534919739, "step": 11900 }, { "epoch": 1.4119739181979845, "grad_norm": 0.421875, "learning_rate": 0.00019470319509445677, "loss": 0.8497, "step": 11910 }, { "contrastive_loss": 3.87939453125, "epoch": 1.4119739181979845, "mse_loss": 0.09121201187372208, "step": 11910 }, { "epoch": 1.4131594546532305, "grad_norm": 0.41796875, "learning_rate": 0.0001946899121480655, "loss": 0.8475, "step": 11920 }, { "contrastive_loss": 3.8824462890625, "epoch": 1.4131594546532305, "mse_loss": 0.06435202062129974, "step": 11920 }, { "epoch": 1.4143449911084767, "grad_norm": 0.45703125, "learning_rate": 0.00019467661302175802, "loss": 0.85, "step": 11930 }, { "contrastive_loss": 3.9801025390625, "epoch": 1.4143449911084767, "mse_loss": 0.0615101158618927, "step": 11930 }, { "epoch": 1.4155305275637227, "grad_norm": 0.41796875, "learning_rate": 0.00019466329771780676, "loss": 0.8584, "step": 11940 }, { "contrastive_loss": 3.8270263671875, "epoch": 1.4155305275637227, "mse_loss": 0.07628381997346878, "step": 11940 }, { "epoch": 1.4167160640189687, "grad_norm": 0.52734375, "learning_rate": 0.00019464996623848698, "loss": 0.8493, "step": 11950 }, { "contrastive_loss": 3.877685546875, "epoch": 1.4167160640189687, "mse_loss": 0.040796853601932526, "step": 11950 }, { "epoch": 1.4179016004742147, "grad_norm": 0.5234375, "learning_rate": 0.00019463661858607666, "loss": 0.861, "step": 11960 }, { "contrastive_loss": 3.723876953125, "epoch": 1.4179016004742147, "mse_loss": 0.1093873605132103, "step": 11960 }, { "epoch": 1.4190871369294606, "grad_norm": 0.431640625, "learning_rate": 0.00019462325476285653, "loss": 0.8496, "step": 11970 }, { "contrastive_loss": 3.9490966796875, "epoch": 1.4190871369294606, "mse_loss": 0.0771762952208519, "step": 11970 }, { "epoch": 1.4202726733847066, "grad_norm": 0.427734375, "learning_rate": 0.00019460987477111012, "loss": 0.8502, "step": 11980 }, { "contrastive_loss": 4.0111083984375, "epoch": 1.4202726733847066, "mse_loss": 0.0689769983291626, "step": 11980 }, { "epoch": 1.4214582098399526, "grad_norm": 0.43359375, "learning_rate": 0.00019459647861312372, "loss": 0.8614, "step": 11990 }, { "contrastive_loss": 3.884521484375, "epoch": 1.4214582098399526, "mse_loss": 0.06779991835355759, "step": 11990 }, { "epoch": 1.4226437462951986, "grad_norm": 0.4375, "learning_rate": 0.00019458306629118632, "loss": 0.8592, "step": 12000 }, { "contrastive_loss": 3.885986328125, "epoch": 1.4226437462951986, "mse_loss": 0.0630585178732872, "step": 12000 }, { "epoch": 1.4238292827504446, "grad_norm": 0.470703125, "learning_rate": 0.00019456963780758972, "loss": 0.8575, "step": 12010 }, { "contrastive_loss": 4.044189453125, "epoch": 1.4238292827504446, "mse_loss": 0.06307963281869888, "step": 12010 }, { "epoch": 1.4250148192056906, "grad_norm": 0.40234375, "learning_rate": 0.00019455619316462855, "loss": 0.8578, "step": 12020 }, { "contrastive_loss": 3.9412841796875, "epoch": 1.4250148192056906, "mse_loss": 0.06565774232149124, "step": 12020 }, { "epoch": 1.4262003556609366, "grad_norm": 0.48828125, "learning_rate": 0.00019454273236460006, "loss": 0.867, "step": 12030 }, { "contrastive_loss": 3.967529296875, "epoch": 1.4262003556609366, "mse_loss": 0.0597669817507267, "step": 12030 }, { "epoch": 1.4273858921161826, "grad_norm": 0.5, "learning_rate": 0.00019452925540980437, "loss": 0.8436, "step": 12040 }, { "contrastive_loss": 3.959716796875, "epoch": 1.4273858921161826, "mse_loss": 0.0831957533955574, "step": 12040 }, { "epoch": 1.4285714285714286, "grad_norm": 0.470703125, "learning_rate": 0.00019451576230254428, "loss": 0.8556, "step": 12050 }, { "contrastive_loss": 3.9072265625, "epoch": 1.4285714285714286, "mse_loss": 0.0791270062327385, "step": 12050 }, { "epoch": 1.4297569650266746, "grad_norm": 0.5078125, "learning_rate": 0.00019450225304512548, "loss": 0.8531, "step": 12060 }, { "contrastive_loss": 3.8734130859375, "epoch": 1.4297569650266746, "mse_loss": 0.05587107688188553, "step": 12060 }, { "epoch": 1.4309425014819206, "grad_norm": 0.52734375, "learning_rate": 0.00019448872763985623, "loss": 0.8568, "step": 12070 }, { "contrastive_loss": 3.9730224609375, "epoch": 1.4309425014819206, "mse_loss": 0.05873574689030647, "step": 12070 }, { "epoch": 1.4321280379371666, "grad_norm": 0.7109375, "learning_rate": 0.00019447518608904773, "loss": 0.8597, "step": 12080 }, { "contrastive_loss": 3.868408203125, "epoch": 1.4321280379371666, "mse_loss": 0.07111247628927231, "step": 12080 }, { "epoch": 1.4333135743924126, "grad_norm": 0.494140625, "learning_rate": 0.0001944616283950138, "loss": 0.8596, "step": 12090 }, { "contrastive_loss": 3.8172607421875, "epoch": 1.4333135743924126, "mse_loss": 0.0764077827334404, "step": 12090 }, { "epoch": 1.4344991108476586, "grad_norm": 0.466796875, "learning_rate": 0.00019444805456007115, "loss": 0.8711, "step": 12100 }, { "contrastive_loss": 4.02197265625, "epoch": 1.4344991108476586, "mse_loss": 0.05399502441287041, "step": 12100 }, { "epoch": 1.4356846473029046, "grad_norm": 0.3984375, "learning_rate": 0.00019443446458653906, "loss": 0.8647, "step": 12110 }, { "contrastive_loss": 3.942138671875, "epoch": 1.4356846473029046, "mse_loss": 0.0876118615269661, "step": 12110 }, { "epoch": 1.4368701837581506, "grad_norm": 0.53515625, "learning_rate": 0.00019442085847673984, "loss": 0.8592, "step": 12120 }, { "contrastive_loss": 3.99462890625, "epoch": 1.4368701837581506, "mse_loss": 0.06800276041030884, "step": 12120 }, { "epoch": 1.4380557202133966, "grad_norm": 0.5078125, "learning_rate": 0.0001944072362329983, "loss": 0.8493, "step": 12130 }, { "contrastive_loss": 3.9410400390625, "epoch": 1.4380557202133966, "mse_loss": 0.0613919198513031, "step": 12130 }, { "epoch": 1.4392412566686426, "grad_norm": 0.376953125, "learning_rate": 0.00019439359785764212, "loss": 0.8449, "step": 12140 }, { "contrastive_loss": 3.8052978515625, "epoch": 1.4392412566686426, "mse_loss": 0.06299800425767899, "step": 12140 }, { "epoch": 1.4404267931238885, "grad_norm": 0.390625, "learning_rate": 0.0001943799433530017, "loss": 0.8628, "step": 12150 }, { "contrastive_loss": 3.911865234375, "epoch": 1.4404267931238885, "mse_loss": 0.10941774398088455, "step": 12150 }, { "epoch": 1.4416123295791345, "grad_norm": 0.44140625, "learning_rate": 0.0001943662727214103, "loss": 0.8613, "step": 12160 }, { "contrastive_loss": 3.8402099609375, "epoch": 1.4416123295791345, "mse_loss": 0.0646011009812355, "step": 12160 }, { "epoch": 1.4427978660343805, "grad_norm": 0.396484375, "learning_rate": 0.00019435258596520383, "loss": 0.8485, "step": 12170 }, { "contrastive_loss": 3.908447265625, "epoch": 1.4427978660343805, "mse_loss": 0.0832740068435669, "step": 12170 }, { "epoch": 1.4439834024896265, "grad_norm": 0.90234375, "learning_rate": 0.00019433888308672094, "loss": 0.858, "step": 12180 }, { "contrastive_loss": 3.9420166015625, "epoch": 1.4439834024896265, "mse_loss": 0.125848188996315, "step": 12180 }, { "epoch": 1.4451689389448725, "grad_norm": 0.455078125, "learning_rate": 0.00019432516408830313, "loss": 0.868, "step": 12190 }, { "contrastive_loss": 3.888427734375, "epoch": 1.4451689389448725, "mse_loss": 0.054541878402233124, "step": 12190 }, { "epoch": 1.4463544754001185, "grad_norm": 0.337890625, "learning_rate": 0.00019431142897229455, "loss": 0.837, "step": 12200 }, { "contrastive_loss": 3.7991943359375, "epoch": 1.4463544754001185, "mse_loss": 0.047035396099090576, "step": 12200 }, { "epoch": 1.4475400118553645, "grad_norm": 0.546875, "learning_rate": 0.0001942976777410422, "loss": 0.8716, "step": 12210 }, { "contrastive_loss": 3.8533935546875, "epoch": 1.4475400118553645, "mse_loss": 0.0678502544760704, "step": 12210 }, { "epoch": 1.4487255483106105, "grad_norm": 0.60546875, "learning_rate": 0.00019428391039689577, "loss": 0.8581, "step": 12220 }, { "contrastive_loss": 3.8167724609375, "epoch": 1.4487255483106105, "mse_loss": 0.053583528846502304, "step": 12220 }, { "epoch": 1.4499110847658565, "grad_norm": 0.51171875, "learning_rate": 0.00019427012694220772, "loss": 0.8559, "step": 12230 }, { "contrastive_loss": 3.95947265625, "epoch": 1.4499110847658565, "mse_loss": 0.05743829533457756, "step": 12230 }, { "epoch": 1.4510966212211025, "grad_norm": 0.470703125, "learning_rate": 0.00019425632737933324, "loss": 0.8555, "step": 12240 }, { "contrastive_loss": 3.7740478515625, "epoch": 1.4510966212211025, "mse_loss": 0.07766089588403702, "step": 12240 }, { "epoch": 1.4522821576763485, "grad_norm": 0.5546875, "learning_rate": 0.00019424251171063035, "loss": 0.8512, "step": 12250 }, { "contrastive_loss": 3.8133544921875, "epoch": 1.4522821576763485, "mse_loss": 0.07608337700366974, "step": 12250 }, { "epoch": 1.4534676941315945, "grad_norm": 0.53515625, "learning_rate": 0.00019422867993845977, "loss": 0.8518, "step": 12260 }, { "contrastive_loss": 3.86181640625, "epoch": 1.4534676941315945, "mse_loss": 0.11398851871490479, "step": 12260 }, { "epoch": 1.4546532305868405, "grad_norm": 0.443359375, "learning_rate": 0.0001942148320651849, "loss": 0.8558, "step": 12270 }, { "contrastive_loss": 3.9000244140625, "epoch": 1.4546532305868405, "mse_loss": 0.06382168084383011, "step": 12270 }, { "epoch": 1.4558387670420865, "grad_norm": 0.470703125, "learning_rate": 0.00019420096809317206, "loss": 0.8554, "step": 12280 }, { "contrastive_loss": 3.904296875, "epoch": 1.4558387670420865, "mse_loss": 0.06634820997714996, "step": 12280 }, { "epoch": 1.4570243034973325, "grad_norm": 0.65234375, "learning_rate": 0.00019418708802479016, "loss": 0.8461, "step": 12290 }, { "contrastive_loss": 3.95361328125, "epoch": 1.4570243034973325, "mse_loss": 0.052877943962812424, "step": 12290 }, { "epoch": 1.4582098399525785, "grad_norm": 0.46484375, "learning_rate": 0.00019417319186241093, "loss": 0.8501, "step": 12300 }, { "contrastive_loss": 3.9764404296875, "epoch": 1.4582098399525785, "mse_loss": 0.08141352236270905, "step": 12300 }, { "epoch": 1.4593953764078245, "grad_norm": 0.44921875, "learning_rate": 0.00019415927960840886, "loss": 0.8562, "step": 12310 }, { "contrastive_loss": 3.9971923828125, "epoch": 1.4593953764078245, "mse_loss": 0.0801076740026474, "step": 12310 }, { "epoch": 1.4605809128630705, "grad_norm": 0.45703125, "learning_rate": 0.00019414535126516117, "loss": 0.8629, "step": 12320 }, { "contrastive_loss": 3.96826171875, "epoch": 1.4605809128630705, "mse_loss": 0.08263860642910004, "step": 12320 }, { "epoch": 1.4617664493183167, "grad_norm": 0.4609375, "learning_rate": 0.0001941314068350478, "loss": 0.8496, "step": 12330 }, { "contrastive_loss": 3.8935546875, "epoch": 1.4617664493183167, "mse_loss": 0.06396383792161942, "step": 12330 }, { "epoch": 1.4629519857735627, "grad_norm": 0.50390625, "learning_rate": 0.00019411744632045154, "loss": 0.8634, "step": 12340 }, { "contrastive_loss": 3.9534912109375, "epoch": 1.4629519857735627, "mse_loss": 0.060742370784282684, "step": 12340 }, { "epoch": 1.4641375222288087, "grad_norm": 0.43359375, "learning_rate": 0.00019410346972375782, "loss": 0.8535, "step": 12350 }, { "contrastive_loss": 4.0137939453125, "epoch": 1.4641375222288087, "mse_loss": 0.06361784785985947, "step": 12350 }, { "epoch": 1.4653230586840547, "grad_norm": 0.408203125, "learning_rate": 0.00019408947704735482, "loss": 0.8543, "step": 12360 }, { "contrastive_loss": 3.910888671875, "epoch": 1.4653230586840547, "mse_loss": 0.0872921571135521, "step": 12360 }, { "epoch": 1.4665085951393007, "grad_norm": 0.474609375, "learning_rate": 0.0001940754682936336, "loss": 0.8565, "step": 12370 }, { "contrastive_loss": 3.796630859375, "epoch": 1.4665085951393007, "mse_loss": 0.08292458206415176, "step": 12370 }, { "epoch": 1.4676941315945466, "grad_norm": 0.515625, "learning_rate": 0.00019406144346498778, "loss": 0.8563, "step": 12380 }, { "contrastive_loss": 3.8507080078125, "epoch": 1.4676941315945466, "mse_loss": 0.0598938874900341, "step": 12380 }, { "epoch": 1.4688796680497926, "grad_norm": 0.59375, "learning_rate": 0.00019404740256381386, "loss": 0.8505, "step": 12390 }, { "contrastive_loss": 3.877685546875, "epoch": 1.4688796680497926, "mse_loss": 0.07631499320268631, "step": 12390 }, { "epoch": 1.4700652045050386, "grad_norm": 0.4609375, "learning_rate": 0.00019403334559251105, "loss": 0.8506, "step": 12400 }, { "contrastive_loss": 3.94140625, "epoch": 1.4700652045050386, "mse_loss": 0.07957662642002106, "step": 12400 }, { "epoch": 1.4712507409602846, "grad_norm": 0.59765625, "learning_rate": 0.0001940192725534813, "loss": 0.8645, "step": 12410 }, { "contrastive_loss": 3.947998046875, "epoch": 1.4712507409602846, "mse_loss": 0.08312910050153732, "step": 12410 }, { "epoch": 1.4724362774155306, "grad_norm": 0.408203125, "learning_rate": 0.0001940051834491293, "loss": 0.8616, "step": 12420 }, { "contrastive_loss": 3.9122314453125, "epoch": 1.4724362774155306, "mse_loss": 0.0832282230257988, "step": 12420 }, { "epoch": 1.4736218138707766, "grad_norm": 0.4453125, "learning_rate": 0.00019399107828186248, "loss": 0.848, "step": 12430 }, { "contrastive_loss": 4.08740234375, "epoch": 1.4736218138707766, "mse_loss": 0.059665221720933914, "step": 12430 }, { "epoch": 1.4748073503260226, "grad_norm": 0.51171875, "learning_rate": 0.00019397695705409106, "loss": 0.8635, "step": 12440 }, { "contrastive_loss": 3.7890625, "epoch": 1.4748073503260226, "mse_loss": 0.06620240211486816, "step": 12440 }, { "epoch": 1.4759928867812686, "grad_norm": 0.578125, "learning_rate": 0.000193962819768228, "loss": 0.8503, "step": 12450 }, { "contrastive_loss": 3.86376953125, "epoch": 1.4759928867812686, "mse_loss": 0.06770701706409454, "step": 12450 }, { "epoch": 1.4771784232365146, "grad_norm": 0.51171875, "learning_rate": 0.00019394866642668887, "loss": 0.8456, "step": 12460 }, { "contrastive_loss": 3.8760986328125, "epoch": 1.4771784232365146, "mse_loss": 0.08840394765138626, "step": 12460 }, { "epoch": 1.4783639596917606, "grad_norm": 0.53125, "learning_rate": 0.00019393449703189214, "loss": 0.851, "step": 12470 }, { "contrastive_loss": 3.726318359375, "epoch": 1.4783639596917606, "mse_loss": 0.1020592600107193, "step": 12470 }, { "epoch": 1.4795494961470066, "grad_norm": 0.4296875, "learning_rate": 0.00019392031158625903, "loss": 0.8579, "step": 12480 }, { "contrastive_loss": 3.9742431640625, "epoch": 1.4795494961470066, "mse_loss": 0.05680998042225838, "step": 12480 }, { "epoch": 1.4807350326022526, "grad_norm": 0.427734375, "learning_rate": 0.00019390611009221335, "loss": 0.8517, "step": 12490 }, { "contrastive_loss": 3.7830810546875, "epoch": 1.4807350326022526, "mse_loss": 0.08100719004869461, "step": 12490 }, { "epoch": 1.4819205690574986, "grad_norm": 0.455078125, "learning_rate": 0.00019389189255218184, "loss": 0.8493, "step": 12500 }, { "contrastive_loss": 3.91943359375, "epoch": 1.4819205690574986, "mse_loss": 0.05279765650629997, "step": 12500 }, { "epoch": 1.4831061055127446, "grad_norm": 0.38671875, "learning_rate": 0.00019387765896859382, "loss": 0.8417, "step": 12510 }, { "contrastive_loss": 3.9117431640625, "epoch": 1.4831061055127446, "mse_loss": 0.09679164737462997, "step": 12510 }, { "epoch": 1.4842916419679906, "grad_norm": 0.546875, "learning_rate": 0.00019386340934388142, "loss": 0.8483, "step": 12520 }, { "contrastive_loss": 3.92919921875, "epoch": 1.4842916419679906, "mse_loss": 0.04731660708785057, "step": 12520 }, { "epoch": 1.4854771784232366, "grad_norm": 0.37109375, "learning_rate": 0.00019384914368047955, "loss": 0.8536, "step": 12530 }, { "contrastive_loss": 3.952392578125, "epoch": 1.4854771784232366, "mse_loss": 0.08897922188043594, "step": 12530 }, { "epoch": 1.4866627148784826, "grad_norm": 0.4296875, "learning_rate": 0.00019383486198082582, "loss": 0.8464, "step": 12540 }, { "contrastive_loss": 3.8927001953125, "epoch": 1.4866627148784826, "mse_loss": 0.07136952877044678, "step": 12540 }, { "epoch": 1.4878482513337286, "grad_norm": 0.423828125, "learning_rate": 0.00019382056424736054, "loss": 0.8466, "step": 12550 }, { "contrastive_loss": 3.8448486328125, "epoch": 1.4878482513337286, "mse_loss": 0.07500643283128738, "step": 12550 }, { "epoch": 1.4890337877889745, "grad_norm": 0.57421875, "learning_rate": 0.00019380625048252684, "loss": 0.8467, "step": 12560 }, { "contrastive_loss": 3.8953857421875, "epoch": 1.4890337877889745, "mse_loss": 0.05376279726624489, "step": 12560 }, { "epoch": 1.4902193242442205, "grad_norm": 0.458984375, "learning_rate": 0.00019379192068877055, "loss": 0.8527, "step": 12570 }, { "contrastive_loss": 3.8563232421875, "epoch": 1.4902193242442205, "mse_loss": 0.06281651556491852, "step": 12570 }, { "epoch": 1.4914048606994665, "grad_norm": 0.5234375, "learning_rate": 0.00019377757486854023, "loss": 0.8583, "step": 12580 }, { "contrastive_loss": 4.0106201171875, "epoch": 1.4914048606994665, "mse_loss": 0.04456176236271858, "step": 12580 }, { "epoch": 1.4925903971547125, "grad_norm": 0.4765625, "learning_rate": 0.00019376321302428718, "loss": 0.8493, "step": 12590 }, { "contrastive_loss": 3.86181640625, "epoch": 1.4925903971547125, "mse_loss": 0.0976976752281189, "step": 12590 }, { "epoch": 1.4937759336099585, "grad_norm": 0.6953125, "learning_rate": 0.00019374883515846546, "loss": 0.8512, "step": 12600 }, { "contrastive_loss": 3.9775390625, "epoch": 1.4937759336099585, "mse_loss": 0.0746171846985817, "step": 12600 }, { "epoch": 1.4949614700652045, "grad_norm": 0.54296875, "learning_rate": 0.0001937344412735318, "loss": 0.849, "step": 12610 }, { "contrastive_loss": 4.1470947265625, "epoch": 1.4949614700652045, "mse_loss": 0.09305913001298904, "step": 12610 }, { "epoch": 1.4961470065204505, "grad_norm": 0.6484375, "learning_rate": 0.00019372003137194582, "loss": 0.8608, "step": 12620 }, { "contrastive_loss": 3.860595703125, "epoch": 1.4961470065204505, "mse_loss": 0.07297004759311676, "step": 12620 }, { "epoch": 1.4973325429756965, "grad_norm": 0.478515625, "learning_rate": 0.00019370560545616973, "loss": 0.8582, "step": 12630 }, { "contrastive_loss": 4.04541015625, "epoch": 1.4973325429756965, "mse_loss": 0.05178570747375488, "step": 12630 }, { "epoch": 1.4985180794309425, "grad_norm": 0.53125, "learning_rate": 0.00019369116352866848, "loss": 0.8617, "step": 12640 }, { "contrastive_loss": 3.8077392578125, "epoch": 1.4985180794309425, "mse_loss": 0.07814175635576248, "step": 12640 }, { "epoch": 1.4997036158861885, "grad_norm": 0.39453125, "learning_rate": 0.0001936767055919099, "loss": 0.8606, "step": 12650 }, { "contrastive_loss": 3.87939453125, "epoch": 1.4997036158861885, "mse_loss": 0.06960202008485794, "step": 12650 }, { "epoch": 1.5008891523414345, "grad_norm": 0.41796875, "learning_rate": 0.00019366223164836433, "loss": 0.849, "step": 12660 }, { "contrastive_loss": 3.88037109375, "epoch": 1.5008891523414345, "mse_loss": 0.10441534966230392, "step": 12660 }, { "epoch": 1.5020746887966805, "grad_norm": 0.41015625, "learning_rate": 0.00019364774170050507, "loss": 0.8614, "step": 12670 }, { "contrastive_loss": 3.7916259765625, "epoch": 1.5020746887966805, "mse_loss": 0.04193255677819252, "step": 12670 }, { "epoch": 1.5032602252519265, "grad_norm": 0.486328125, "learning_rate": 0.00019363323575080803, "loss": 0.8412, "step": 12680 }, { "contrastive_loss": 3.82861328125, "epoch": 1.5032602252519265, "mse_loss": 0.055410031229257584, "step": 12680 }, { "epoch": 1.5044457617071725, "grad_norm": 0.46875, "learning_rate": 0.00019361871380175187, "loss": 0.8584, "step": 12690 }, { "contrastive_loss": 3.9051513671875, "epoch": 1.5044457617071725, "mse_loss": 0.0829123705625534, "step": 12690 }, { "epoch": 1.5056312981624185, "grad_norm": 0.490234375, "learning_rate": 0.00019360417585581802, "loss": 0.857, "step": 12700 }, { "contrastive_loss": 3.966064453125, "epoch": 1.5056312981624185, "mse_loss": 0.08380471169948578, "step": 12700 }, { "epoch": 1.5068168346176645, "grad_norm": 0.4609375, "learning_rate": 0.00019358962191549057, "loss": 0.8504, "step": 12710 }, { "contrastive_loss": 3.8929443359375, "epoch": 1.5068168346176645, "mse_loss": 0.08104854077100754, "step": 12710 }, { "epoch": 1.5080023710729105, "grad_norm": 0.498046875, "learning_rate": 0.00019357505198325643, "loss": 0.8568, "step": 12720 }, { "contrastive_loss": 4.032958984375, "epoch": 1.5080023710729105, "mse_loss": 0.06361814588308334, "step": 12720 }, { "epoch": 1.5091879075281565, "grad_norm": 0.4609375, "learning_rate": 0.00019356046606160517, "loss": 0.8638, "step": 12730 }, { "contrastive_loss": 3.799072265625, "epoch": 1.5091879075281565, "mse_loss": 0.0613502636551857, "step": 12730 }, { "epoch": 1.5103734439834025, "grad_norm": 0.455078125, "learning_rate": 0.00019354586415302918, "loss": 0.8438, "step": 12740 }, { "contrastive_loss": 3.8885498046875, "epoch": 1.5103734439834025, "mse_loss": 0.06513427942991257, "step": 12740 }, { "epoch": 1.5115589804386484, "grad_norm": 0.474609375, "learning_rate": 0.00019353124626002346, "loss": 0.8521, "step": 12750 }, { "contrastive_loss": 4.0079345703125, "epoch": 1.5115589804386484, "mse_loss": 0.06531250476837158, "step": 12750 }, { "epoch": 1.5127445168938944, "grad_norm": 0.3359375, "learning_rate": 0.00019351661238508586, "loss": 0.8524, "step": 12760 }, { "contrastive_loss": 4.1136474609375, "epoch": 1.5127445168938944, "mse_loss": 0.06254822015762329, "step": 12760 }, { "epoch": 1.5139300533491404, "grad_norm": 0.416015625, "learning_rate": 0.00019350196253071686, "loss": 0.8555, "step": 12770 }, { "contrastive_loss": 3.9461669921875, "epoch": 1.5139300533491404, "mse_loss": 0.07332195341587067, "step": 12770 }, { "epoch": 1.5151155898043864, "grad_norm": 0.4296875, "learning_rate": 0.00019348729669941975, "loss": 0.8585, "step": 12780 }, { "contrastive_loss": 3.7489013671875, "epoch": 1.5151155898043864, "mse_loss": 0.058685533702373505, "step": 12780 }, { "epoch": 1.5163011262596324, "grad_norm": 0.42578125, "learning_rate": 0.00019347261489370055, "loss": 0.8523, "step": 12790 }, { "contrastive_loss": 4.0582275390625, "epoch": 1.5163011262596324, "mse_loss": 0.06050369516015053, "step": 12790 }, { "epoch": 1.5174866627148784, "grad_norm": 0.3984375, "learning_rate": 0.00019345791711606795, "loss": 0.8553, "step": 12800 }, { "contrastive_loss": 3.9794921875, "epoch": 1.5174866627148784, "mse_loss": 0.08824530988931656, "step": 12800 }, { "epoch": 1.5186721991701244, "grad_norm": 0.486328125, "learning_rate": 0.00019344320336903335, "loss": 0.8606, "step": 12810 }, { "contrastive_loss": 3.856689453125, "epoch": 1.5186721991701244, "mse_loss": 0.06551641970872879, "step": 12810 }, { "epoch": 1.5198577356253704, "grad_norm": 0.435546875, "learning_rate": 0.00019342847365511097, "loss": 0.8565, "step": 12820 }, { "contrastive_loss": 3.9510498046875, "epoch": 1.5198577356253704, "mse_loss": 0.06320741772651672, "step": 12820 }, { "epoch": 1.5210432720806164, "grad_norm": 0.54296875, "learning_rate": 0.00019341372797681777, "loss": 0.8571, "step": 12830 }, { "contrastive_loss": 3.9368896484375, "epoch": 1.5210432720806164, "mse_loss": 0.0549398735165596, "step": 12830 }, { "epoch": 1.5222288085358624, "grad_norm": 0.458984375, "learning_rate": 0.00019339896633667329, "loss": 0.8494, "step": 12840 }, { "contrastive_loss": 4.194580078125, "epoch": 1.5222288085358624, "mse_loss": 0.07914268225431442, "step": 12840 }, { "epoch": 1.5234143449911084, "grad_norm": 0.439453125, "learning_rate": 0.00019338418873719994, "loss": 0.868, "step": 12850 }, { "contrastive_loss": 3.87548828125, "epoch": 1.5234143449911084, "mse_loss": 0.06993613392114639, "step": 12850 }, { "epoch": 1.5245998814463544, "grad_norm": 0.44140625, "learning_rate": 0.0001933693951809228, "loss": 0.8507, "step": 12860 }, { "contrastive_loss": 3.91064453125, "epoch": 1.5245998814463544, "mse_loss": 0.09226804226636887, "step": 12860 }, { "epoch": 1.5257854179016004, "grad_norm": 0.41796875, "learning_rate": 0.00019335458567036967, "loss": 0.8643, "step": 12870 }, { "contrastive_loss": 3.9281005859375, "epoch": 1.5257854179016004, "mse_loss": 0.05695611238479614, "step": 12870 }, { "epoch": 1.5269709543568464, "grad_norm": 0.365234375, "learning_rate": 0.00019333976020807114, "loss": 0.842, "step": 12880 }, { "contrastive_loss": 4.192626953125, "epoch": 1.5269709543568464, "mse_loss": 0.08715413510799408, "step": 12880 }, { "epoch": 1.5281564908120924, "grad_norm": 0.42578125, "learning_rate": 0.0001933249187965604, "loss": 0.8586, "step": 12890 }, { "contrastive_loss": 3.87890625, "epoch": 1.5281564908120924, "mse_loss": 0.055402159690856934, "step": 12890 }, { "epoch": 1.5293420272673384, "grad_norm": 0.431640625, "learning_rate": 0.0001933100614383735, "loss": 0.8423, "step": 12900 }, { "contrastive_loss": 3.909912109375, "epoch": 1.5293420272673384, "mse_loss": 0.0639616921544075, "step": 12900 }, { "epoch": 1.5305275637225844, "grad_norm": 0.392578125, "learning_rate": 0.00019329518813604912, "loss": 0.8454, "step": 12910 }, { "contrastive_loss": 4.07568359375, "epoch": 1.5305275637225844, "mse_loss": 0.05556568130850792, "step": 12910 }, { "epoch": 1.5317131001778304, "grad_norm": 0.423828125, "learning_rate": 0.00019328029889212873, "loss": 0.8641, "step": 12920 }, { "contrastive_loss": 4.0361328125, "epoch": 1.5317131001778304, "mse_loss": 0.0909353494644165, "step": 12920 }, { "epoch": 1.5328986366330764, "grad_norm": 0.4609375, "learning_rate": 0.00019326539370915645, "loss": 0.8596, "step": 12930 }, { "contrastive_loss": 3.8541259765625, "epoch": 1.5328986366330764, "mse_loss": 0.040919192135334015, "step": 12930 }, { "epoch": 1.5340841730883223, "grad_norm": 0.404296875, "learning_rate": 0.00019325047258967923, "loss": 0.8404, "step": 12940 }, { "contrastive_loss": 4.0126953125, "epoch": 1.5340841730883223, "mse_loss": 0.07221027463674545, "step": 12940 }, { "epoch": 1.5352697095435683, "grad_norm": 0.42578125, "learning_rate": 0.00019323553553624666, "loss": 0.8518, "step": 12950 }, { "contrastive_loss": 3.8653564453125, "epoch": 1.5352697095435683, "mse_loss": 0.0721910372376442, "step": 12950 }, { "epoch": 1.5364552459988143, "grad_norm": 0.546875, "learning_rate": 0.00019322058255141105, "loss": 0.8583, "step": 12960 }, { "contrastive_loss": 4.0244140625, "epoch": 1.5364552459988143, "mse_loss": 0.049060720950365067, "step": 12960 }, { "epoch": 1.5376407824540603, "grad_norm": 0.578125, "learning_rate": 0.00019320561363772747, "loss": 0.8575, "step": 12970 }, { "contrastive_loss": 3.926025390625, "epoch": 1.5376407824540603, "mse_loss": 0.06547469645738602, "step": 12970 }, { "epoch": 1.5388263189093063, "grad_norm": 0.50390625, "learning_rate": 0.0001931906287977537, "loss": 0.8568, "step": 12980 }, { "contrastive_loss": 4.0032958984375, "epoch": 1.5388263189093063, "mse_loss": 0.07884849607944489, "step": 12980 }, { "epoch": 1.5400118553645523, "grad_norm": 0.40234375, "learning_rate": 0.00019317562803405021, "loss": 0.8623, "step": 12990 }, { "contrastive_loss": 3.791748046875, "epoch": 1.5400118553645523, "mse_loss": 0.06761370599269867, "step": 12990 }, { "epoch": 1.5411973918197983, "grad_norm": 0.404296875, "learning_rate": 0.0001931606113491803, "loss": 0.8512, "step": 13000 }, { "contrastive_loss": 3.869873046875, "epoch": 1.5411973918197983, "mse_loss": 0.06582839787006378, "step": 13000 }, { "epoch": 1.5423829282750443, "grad_norm": 0.412109375, "learning_rate": 0.0001931455787457098, "loss": 0.8566, "step": 13010 }, { "contrastive_loss": 3.9310302734375, "epoch": 1.5423829282750443, "mse_loss": 0.05528441444039345, "step": 13010 }, { "epoch": 1.5435684647302903, "grad_norm": 0.625, "learning_rate": 0.0001931305302262075, "loss": 0.8521, "step": 13020 }, { "contrastive_loss": 4.0382080078125, "epoch": 1.5435684647302903, "mse_loss": 0.07745666801929474, "step": 13020 }, { "epoch": 1.5447540011855363, "grad_norm": 0.51171875, "learning_rate": 0.00019311546579324466, "loss": 0.8622, "step": 13030 }, { "contrastive_loss": 3.8258056640625, "epoch": 1.5447540011855363, "mse_loss": 0.06627541035413742, "step": 13030 }, { "epoch": 1.5459395376407823, "grad_norm": 0.40234375, "learning_rate": 0.00019310038544939544, "loss": 0.8392, "step": 13040 }, { "contrastive_loss": 3.9525146484375, "epoch": 1.5459395376407823, "mse_loss": 0.06256203353404999, "step": 13040 }, { "epoch": 1.5471250740960285, "grad_norm": 0.578125, "learning_rate": 0.00019308528919723665, "loss": 0.8465, "step": 13050 }, { "contrastive_loss": 4.01904296875, "epoch": 1.5471250740960285, "mse_loss": 0.07225262373685837, "step": 13050 }, { "epoch": 1.5483106105512745, "grad_norm": 0.4453125, "learning_rate": 0.00019307017703934783, "loss": 0.8502, "step": 13060 }, { "contrastive_loss": 3.9423828125, "epoch": 1.5483106105512745, "mse_loss": 0.06467950344085693, "step": 13060 }, { "epoch": 1.5494961470065205, "grad_norm": 0.419921875, "learning_rate": 0.0001930550489783112, "loss": 0.8499, "step": 13070 }, { "contrastive_loss": 3.993896484375, "epoch": 1.5494961470065205, "mse_loss": 0.06789369881153107, "step": 13070 }, { "epoch": 1.5506816834617665, "grad_norm": 0.54296875, "learning_rate": 0.00019303990501671182, "loss": 0.8599, "step": 13080 }, { "contrastive_loss": 3.7279052734375, "epoch": 1.5506816834617665, "mse_loss": 0.07367698103189468, "step": 13080 }, { "epoch": 1.5518672199170125, "grad_norm": 0.453125, "learning_rate": 0.00019302474515713725, "loss": 0.8467, "step": 13090 }, { "contrastive_loss": 3.9102783203125, "epoch": 1.5518672199170125, "mse_loss": 0.05999484658241272, "step": 13090 }, { "epoch": 1.5530527563722585, "grad_norm": 0.474609375, "learning_rate": 0.000193009569402178, "loss": 0.8582, "step": 13100 }, { "contrastive_loss": 3.9117431640625, "epoch": 1.5530527563722585, "mse_loss": 0.07294739782810211, "step": 13100 }, { "epoch": 1.5542382928275045, "grad_norm": 0.40625, "learning_rate": 0.00019299437775442715, "loss": 0.8519, "step": 13110 }, { "contrastive_loss": 4.00537109375, "epoch": 1.5542382928275045, "mse_loss": 0.04552203416824341, "step": 13110 }, { "epoch": 1.5554238292827505, "grad_norm": 0.51171875, "learning_rate": 0.00019297917021648056, "loss": 0.8543, "step": 13120 }, { "contrastive_loss": 3.8765869140625, "epoch": 1.5554238292827505, "mse_loss": 0.1099015325307846, "step": 13120 }, { "epoch": 1.5566093657379965, "grad_norm": 0.46875, "learning_rate": 0.00019296394679093674, "loss": 0.857, "step": 13130 }, { "contrastive_loss": 3.9403076171875, "epoch": 1.5566093657379965, "mse_loss": 0.048858873546123505, "step": 13130 }, { "epoch": 1.5577949021932425, "grad_norm": 0.458984375, "learning_rate": 0.00019294870748039702, "loss": 0.8465, "step": 13140 }, { "contrastive_loss": 3.9278564453125, "epoch": 1.5577949021932425, "mse_loss": 0.08653654158115387, "step": 13140 }, { "epoch": 1.5589804386484885, "grad_norm": 0.5, "learning_rate": 0.00019293345228746532, "loss": 0.8622, "step": 13150 }, { "contrastive_loss": 3.9324951171875, "epoch": 1.5589804386484885, "mse_loss": 0.05714127793908119, "step": 13150 }, { "epoch": 1.5601659751037344, "grad_norm": 0.458984375, "learning_rate": 0.00019291818121474835, "loss": 0.8566, "step": 13160 }, { "contrastive_loss": 3.911376953125, "epoch": 1.5601659751037344, "mse_loss": 0.07127918303012848, "step": 13160 }, { "epoch": 1.5613515115589804, "grad_norm": 0.50390625, "learning_rate": 0.00019290289426485556, "loss": 0.8489, "step": 13170 }, { "contrastive_loss": 3.9437255859375, "epoch": 1.5613515115589804, "mse_loss": 0.06702873855829239, "step": 13170 }, { "epoch": 1.5625370480142264, "grad_norm": 0.51171875, "learning_rate": 0.000192887591440399, "loss": 0.8638, "step": 13180 }, { "contrastive_loss": 3.9515380859375, "epoch": 1.5625370480142264, "mse_loss": 0.0688382014632225, "step": 13180 }, { "epoch": 1.5637225844694724, "grad_norm": 0.5859375, "learning_rate": 0.00019287227274399356, "loss": 0.8493, "step": 13190 }, { "contrastive_loss": 3.951171875, "epoch": 1.5637225844694724, "mse_loss": 0.06388626247644424, "step": 13190 }, { "epoch": 1.5649081209247184, "grad_norm": 0.42578125, "learning_rate": 0.00019285693817825677, "loss": 0.8636, "step": 13200 }, { "contrastive_loss": 3.857421875, "epoch": 1.5649081209247184, "mse_loss": 0.07116355746984482, "step": 13200 }, { "epoch": 1.5660936573799644, "grad_norm": 0.458984375, "learning_rate": 0.00019284158774580888, "loss": 0.8473, "step": 13210 }, { "contrastive_loss": 4.06689453125, "epoch": 1.5660936573799644, "mse_loss": 0.06996307522058487, "step": 13210 }, { "epoch": 1.5672791938352104, "grad_norm": 0.396484375, "learning_rate": 0.00019282622144927287, "loss": 0.8601, "step": 13220 }, { "contrastive_loss": 4.0101318359375, "epoch": 1.5672791938352104, "mse_loss": 0.0797244980931282, "step": 13220 }, { "epoch": 1.5684647302904564, "grad_norm": 0.47265625, "learning_rate": 0.00019281083929127444, "loss": 0.8623, "step": 13230 }, { "contrastive_loss": 3.8271484375, "epoch": 1.5684647302904564, "mse_loss": 0.05537368729710579, "step": 13230 }, { "epoch": 1.5696502667457024, "grad_norm": 0.478515625, "learning_rate": 0.00019279544127444193, "loss": 0.8536, "step": 13240 }, { "contrastive_loss": 3.848388671875, "epoch": 1.5696502667457024, "mse_loss": 0.07187171280384064, "step": 13240 }, { "epoch": 1.5708358032009484, "grad_norm": 0.53515625, "learning_rate": 0.00019278002740140648, "loss": 0.8529, "step": 13250 }, { "contrastive_loss": 3.82177734375, "epoch": 1.5708358032009484, "mse_loss": 0.06636353582143784, "step": 13250 }, { "epoch": 1.5720213396561944, "grad_norm": 0.55859375, "learning_rate": 0.0001927645976748019, "loss": 0.8575, "step": 13260 }, { "contrastive_loss": 3.9296875, "epoch": 1.5720213396561944, "mse_loss": 0.06554179638624191, "step": 13260 }, { "epoch": 1.5732068761114404, "grad_norm": 0.52734375, "learning_rate": 0.00019274915209726467, "loss": 0.8649, "step": 13270 }, { "contrastive_loss": 3.837646484375, "epoch": 1.5732068761114404, "mse_loss": 0.08416423946619034, "step": 13270 }, { "epoch": 1.5743924125666864, "grad_norm": 0.53515625, "learning_rate": 0.00019273369067143405, "loss": 0.8549, "step": 13280 }, { "contrastive_loss": 3.9197998046875, "epoch": 1.5743924125666864, "mse_loss": 0.059929944574832916, "step": 13280 }, { "epoch": 1.5755779490219324, "grad_norm": 0.458984375, "learning_rate": 0.00019271821339995199, "loss": 0.8591, "step": 13290 }, { "contrastive_loss": 3.827880859375, "epoch": 1.5755779490219324, "mse_loss": 0.06158678978681564, "step": 13290 }, { "epoch": 1.5767634854771784, "grad_norm": 0.40625, "learning_rate": 0.00019270272028546308, "loss": 0.8599, "step": 13300 }, { "contrastive_loss": 4.003662109375, "epoch": 1.5767634854771784, "mse_loss": 0.06682686507701874, "step": 13300 }, { "epoch": 1.5779490219324244, "grad_norm": 0.380859375, "learning_rate": 0.0001926872113306147, "loss": 0.8466, "step": 13310 }, { "contrastive_loss": 3.8837890625, "epoch": 1.5779490219324244, "mse_loss": 0.0747826099395752, "step": 13310 }, { "epoch": 1.5791345583876706, "grad_norm": 0.40625, "learning_rate": 0.0001926716865380569, "loss": 0.8523, "step": 13320 }, { "contrastive_loss": 3.8978271484375, "epoch": 1.5791345583876706, "mse_loss": 0.08159596472978592, "step": 13320 }, { "epoch": 1.5803200948429166, "grad_norm": 0.4296875, "learning_rate": 0.00019265614591044248, "loss": 0.8466, "step": 13330 }, { "contrastive_loss": 3.782470703125, "epoch": 1.5803200948429166, "mse_loss": 0.07001477479934692, "step": 13330 }, { "epoch": 1.5815056312981626, "grad_norm": 0.4453125, "learning_rate": 0.00019264058945042684, "loss": 0.8484, "step": 13340 }, { "contrastive_loss": 3.907470703125, "epoch": 1.5815056312981626, "mse_loss": 0.06857410818338394, "step": 13340 }, { "epoch": 1.5826911677534086, "grad_norm": 0.474609375, "learning_rate": 0.00019262501716066818, "loss": 0.8425, "step": 13350 }, { "contrastive_loss": 3.900634765625, "epoch": 1.5826911677534086, "mse_loss": 0.07056637108325958, "step": 13350 }, { "epoch": 1.5838767042086546, "grad_norm": 0.458984375, "learning_rate": 0.00019260942904382743, "loss": 0.863, "step": 13360 }, { "contrastive_loss": 3.889892578125, "epoch": 1.5838767042086546, "mse_loss": 0.10108030587434769, "step": 13360 }, { "epoch": 1.5850622406639006, "grad_norm": 0.45703125, "learning_rate": 0.0001925938251025681, "loss": 0.8419, "step": 13370 }, { "contrastive_loss": 3.8927001953125, "epoch": 1.5850622406639006, "mse_loss": 0.07643011957406998, "step": 13370 }, { "epoch": 1.5862477771191466, "grad_norm": 0.37890625, "learning_rate": 0.0001925782053395565, "loss": 0.855, "step": 13380 }, { "contrastive_loss": 3.91162109375, "epoch": 1.5862477771191466, "mse_loss": 0.07272636890411377, "step": 13380 }, { "epoch": 1.5874333135743925, "grad_norm": 0.640625, "learning_rate": 0.00019256256975746166, "loss": 0.8542, "step": 13390 }, { "contrastive_loss": 3.9415283203125, "epoch": 1.5874333135743925, "mse_loss": 0.06325452029705048, "step": 13390 }, { "epoch": 1.5886188500296385, "grad_norm": 0.388671875, "learning_rate": 0.00019254691835895522, "loss": 0.8434, "step": 13400 }, { "contrastive_loss": 3.8128662109375, "epoch": 1.5886188500296385, "mse_loss": 0.08217180520296097, "step": 13400 }, { "epoch": 1.5898043864848845, "grad_norm": 0.404296875, "learning_rate": 0.00019253125114671157, "loss": 0.8463, "step": 13410 }, { "contrastive_loss": 3.7801513671875, "epoch": 1.5898043864848845, "mse_loss": 0.07105619460344315, "step": 13410 }, { "epoch": 1.5909899229401305, "grad_norm": 0.44921875, "learning_rate": 0.00019251556812340787, "loss": 0.8448, "step": 13420 }, { "contrastive_loss": 3.9520263671875, "epoch": 1.5909899229401305, "mse_loss": 0.09077896922826767, "step": 13420 }, { "epoch": 1.5921754593953765, "grad_norm": 0.482421875, "learning_rate": 0.00019249986929172386, "loss": 0.8688, "step": 13430 }, { "contrastive_loss": 4.0125732421875, "epoch": 1.5921754593953765, "mse_loss": 0.09169314801692963, "step": 13430 }, { "epoch": 1.5933609958506225, "grad_norm": 0.453125, "learning_rate": 0.0001924841546543421, "loss": 0.8676, "step": 13440 }, { "contrastive_loss": 3.857666015625, "epoch": 1.5933609958506225, "mse_loss": 0.05610060691833496, "step": 13440 }, { "epoch": 1.5945465323058685, "grad_norm": 0.412109375, "learning_rate": 0.00019246842421394772, "loss": 0.8642, "step": 13450 }, { "contrastive_loss": 3.99072265625, "epoch": 1.5945465323058685, "mse_loss": 0.06533140689134598, "step": 13450 }, { "epoch": 1.5957320687611145, "grad_norm": 0.48046875, "learning_rate": 0.00019245267797322868, "loss": 0.8554, "step": 13460 }, { "contrastive_loss": 3.983154296875, "epoch": 1.5957320687611145, "mse_loss": 0.07701272517442703, "step": 13460 }, { "epoch": 1.5969176052163605, "grad_norm": 0.4453125, "learning_rate": 0.00019243691593487556, "loss": 0.8589, "step": 13470 }, { "contrastive_loss": 3.8167724609375, "epoch": 1.5969176052163605, "mse_loss": 0.05271485820412636, "step": 13470 }, { "epoch": 1.5981031416716065, "grad_norm": 0.4453125, "learning_rate": 0.00019242113810158165, "loss": 0.8471, "step": 13480 }, { "contrastive_loss": 4.069091796875, "epoch": 1.5981031416716065, "mse_loss": 0.09566613286733627, "step": 13480 }, { "epoch": 1.5992886781268525, "grad_norm": 0.5234375, "learning_rate": 0.00019240534447604297, "loss": 0.8602, "step": 13490 }, { "contrastive_loss": 3.8446044921875, "epoch": 1.5992886781268525, "mse_loss": 0.09627556055784225, "step": 13490 }, { "epoch": 1.6004742145820985, "grad_norm": 0.419921875, "learning_rate": 0.00019238953506095822, "loss": 0.8433, "step": 13500 }, { "contrastive_loss": 3.9423828125, "epoch": 1.6004742145820985, "mse_loss": 0.08442274481058121, "step": 13500 }, { "epoch": 1.6016597510373445, "grad_norm": 0.462890625, "learning_rate": 0.00019237370985902876, "loss": 0.855, "step": 13510 }, { "contrastive_loss": 3.9293212890625, "epoch": 1.6016597510373445, "mse_loss": 0.06374462693929672, "step": 13510 }, { "epoch": 1.6028452874925905, "grad_norm": 0.408203125, "learning_rate": 0.00019235786887295876, "loss": 0.8439, "step": 13520 }, { "contrastive_loss": 3.959716796875, "epoch": 1.6028452874925905, "mse_loss": 0.07798861712217331, "step": 13520 }, { "epoch": 1.6040308239478365, "grad_norm": 0.390625, "learning_rate": 0.00019234201210545493, "loss": 0.8457, "step": 13530 }, { "contrastive_loss": 3.9144287109375, "epoch": 1.6040308239478365, "mse_loss": 0.08149518072605133, "step": 13530 }, { "epoch": 1.6052163604030825, "grad_norm": 0.55859375, "learning_rate": 0.00019232613955922677, "loss": 0.8556, "step": 13540 }, { "contrastive_loss": 3.82470703125, "epoch": 1.6052163604030825, "mse_loss": 0.09039369970560074, "step": 13540 }, { "epoch": 1.6064018968583285, "grad_norm": 0.43359375, "learning_rate": 0.00019231025123698652, "loss": 0.8587, "step": 13550 }, { "contrastive_loss": 3.8824462890625, "epoch": 1.6064018968583285, "mse_loss": 0.06833861768245697, "step": 13550 }, { "epoch": 1.6075874333135745, "grad_norm": 0.50390625, "learning_rate": 0.000192294347141449, "loss": 0.8598, "step": 13560 }, { "contrastive_loss": 3.8662109375, "epoch": 1.6075874333135745, "mse_loss": 0.052454907447099686, "step": 13560 }, { "epoch": 1.6087729697688204, "grad_norm": 0.54296875, "learning_rate": 0.00019227842727533183, "loss": 0.8465, "step": 13570 }, { "contrastive_loss": 3.8218994140625, "epoch": 1.6087729697688204, "mse_loss": 0.09069063514471054, "step": 13570 }, { "epoch": 1.6099585062240664, "grad_norm": 0.443359375, "learning_rate": 0.00019226249164135527, "loss": 0.8535, "step": 13580 }, { "contrastive_loss": 4.081787109375, "epoch": 1.6099585062240664, "mse_loss": 0.08725760132074356, "step": 13580 }, { "epoch": 1.6111440426793124, "grad_norm": 0.400390625, "learning_rate": 0.00019224654024224225, "loss": 0.8527, "step": 13590 }, { "contrastive_loss": 3.9442138671875, "epoch": 1.6111440426793124, "mse_loss": 0.054495301097631454, "step": 13590 }, { "epoch": 1.6123295791345584, "grad_norm": 0.5234375, "learning_rate": 0.00019223057308071843, "loss": 0.8541, "step": 13600 }, { "contrastive_loss": 3.821044921875, "epoch": 1.6123295791345584, "mse_loss": 0.0695209801197052, "step": 13600 }, { "epoch": 1.6135151155898044, "grad_norm": 0.50390625, "learning_rate": 0.00019221459015951223, "loss": 0.8397, "step": 13610 }, { "contrastive_loss": 3.8741455078125, "epoch": 1.6135151155898044, "mse_loss": 0.07824473828077316, "step": 13610 }, { "epoch": 1.6147006520450504, "grad_norm": 0.484375, "learning_rate": 0.00019219859148135462, "loss": 0.857, "step": 13620 }, { "contrastive_loss": 3.8983154296875, "epoch": 1.6147006520450504, "mse_loss": 0.08800840377807617, "step": 13620 }, { "epoch": 1.6158861885002964, "grad_norm": 0.359375, "learning_rate": 0.00019218257704897934, "loss": 0.8447, "step": 13630 }, { "contrastive_loss": 3.936279296875, "epoch": 1.6158861885002964, "mse_loss": 0.06815426051616669, "step": 13630 }, { "epoch": 1.6170717249555424, "grad_norm": 0.44140625, "learning_rate": 0.00019216654686512286, "loss": 0.8652, "step": 13640 }, { "contrastive_loss": 3.8792724609375, "epoch": 1.6170717249555424, "mse_loss": 0.06995698064565659, "step": 13640 }, { "epoch": 1.6182572614107884, "grad_norm": 0.46484375, "learning_rate": 0.0001921505009325243, "loss": 0.855, "step": 13650 }, { "contrastive_loss": 3.9871826171875, "epoch": 1.6182572614107884, "mse_loss": 0.09658553451299667, "step": 13650 }, { "epoch": 1.6194427978660344, "grad_norm": 0.443359375, "learning_rate": 0.00019213443925392544, "loss": 0.8507, "step": 13660 }, { "contrastive_loss": 3.929931640625, "epoch": 1.6194427978660344, "mse_loss": 0.08380109816789627, "step": 13660 }, { "epoch": 1.6206283343212804, "grad_norm": 0.5, "learning_rate": 0.0001921183618320708, "loss": 0.8498, "step": 13670 }, { "contrastive_loss": 4.003662109375, "epoch": 1.6206283343212804, "mse_loss": 0.08286786824464798, "step": 13670 }, { "epoch": 1.6218138707765264, "grad_norm": 0.462890625, "learning_rate": 0.00019210226866970756, "loss": 0.8535, "step": 13680 }, { "contrastive_loss": 3.9744873046875, "epoch": 1.6218138707765264, "mse_loss": 0.06522519886493683, "step": 13680 }, { "epoch": 1.6229994072317724, "grad_norm": 0.51171875, "learning_rate": 0.00019208615976958559, "loss": 0.8453, "step": 13690 }, { "contrastive_loss": 3.8770751953125, "epoch": 1.6229994072317724, "mse_loss": 0.10590272396802902, "step": 13690 }, { "epoch": 1.6241849436870184, "grad_norm": 0.546875, "learning_rate": 0.0001920700351344575, "loss": 0.8606, "step": 13700 }, { "contrastive_loss": 3.967529296875, "epoch": 1.6241849436870184, "mse_loss": 0.08122245222330093, "step": 13700 }, { "epoch": 1.6253704801422644, "grad_norm": 0.37109375, "learning_rate": 0.00019205389476707854, "loss": 0.8515, "step": 13710 }, { "contrastive_loss": 3.7652587890625, "epoch": 1.6253704801422644, "mse_loss": 0.05896469205617905, "step": 13710 }, { "epoch": 1.6265560165975104, "grad_norm": 0.4296875, "learning_rate": 0.00019203773867020662, "loss": 0.8428, "step": 13720 }, { "contrastive_loss": 3.77099609375, "epoch": 1.6265560165975104, "mse_loss": 0.07878490537405014, "step": 13720 }, { "epoch": 1.6277415530527564, "grad_norm": 0.365234375, "learning_rate": 0.0001920215668466024, "loss": 0.8508, "step": 13730 }, { "contrastive_loss": 3.9803466796875, "epoch": 1.6277415530527564, "mse_loss": 0.07198692858219147, "step": 13730 }, { "epoch": 1.6289270895080024, "grad_norm": 0.51171875, "learning_rate": 0.0001920053792990292, "loss": 0.8561, "step": 13740 }, { "contrastive_loss": 3.9395751953125, "epoch": 1.6289270895080024, "mse_loss": 0.1018441915512085, "step": 13740 }, { "epoch": 1.6301126259632484, "grad_norm": 0.6328125, "learning_rate": 0.00019198917603025303, "loss": 0.8491, "step": 13750 }, { "contrastive_loss": 3.8663330078125, "epoch": 1.6301126259632484, "mse_loss": 0.045744847506284714, "step": 13750 }, { "epoch": 1.6312981624184943, "grad_norm": 0.4765625, "learning_rate": 0.00019197295704304258, "loss": 0.8553, "step": 13760 }, { "contrastive_loss": 3.9730224609375, "epoch": 1.6312981624184943, "mse_loss": 0.06238583102822304, "step": 13760 }, { "epoch": 1.6324836988737403, "grad_norm": 0.62890625, "learning_rate": 0.00019195672234016925, "loss": 0.8472, "step": 13770 }, { "contrastive_loss": 3.8304443359375, "epoch": 1.6324836988737403, "mse_loss": 0.07476828247308731, "step": 13770 }, { "epoch": 1.6336692353289863, "grad_norm": 0.47265625, "learning_rate": 0.00019194047192440711, "loss": 0.8512, "step": 13780 }, { "contrastive_loss": 3.9979248046875, "epoch": 1.6336692353289863, "mse_loss": 0.06423196941614151, "step": 13780 }, { "epoch": 1.6348547717842323, "grad_norm": 0.4296875, "learning_rate": 0.00019192420579853287, "loss": 0.8543, "step": 13790 }, { "contrastive_loss": 3.986083984375, "epoch": 1.6348547717842323, "mse_loss": 0.06288871169090271, "step": 13790 }, { "epoch": 1.6360403082394783, "grad_norm": 0.474609375, "learning_rate": 0.000191907923965326, "loss": 0.853, "step": 13800 }, { "contrastive_loss": 3.8917236328125, "epoch": 1.6360403082394783, "mse_loss": 0.09297798573970795, "step": 13800 }, { "epoch": 1.6372258446947243, "grad_norm": 0.58203125, "learning_rate": 0.00019189162642756861, "loss": 0.8639, "step": 13810 }, { "contrastive_loss": 4.0479736328125, "epoch": 1.6372258446947243, "mse_loss": 0.06384176015853882, "step": 13810 }, { "epoch": 1.6384113811499703, "grad_norm": 0.4296875, "learning_rate": 0.00019187531318804553, "loss": 0.8506, "step": 13820 }, { "contrastive_loss": 3.938720703125, "epoch": 1.6384113811499703, "mse_loss": 0.1234014704823494, "step": 13820 }, { "epoch": 1.6395969176052163, "grad_norm": 0.42578125, "learning_rate": 0.0001918589842495442, "loss": 0.8644, "step": 13830 }, { "contrastive_loss": 3.9246826171875, "epoch": 1.6395969176052163, "mse_loss": 0.0632701888680458, "step": 13830 }, { "epoch": 1.6407824540604623, "grad_norm": 0.470703125, "learning_rate": 0.0001918426396148548, "loss": 0.8501, "step": 13840 }, { "contrastive_loss": 3.8470458984375, "epoch": 1.6407824540604623, "mse_loss": 0.06153735890984535, "step": 13840 }, { "epoch": 1.6419679905157083, "grad_norm": 0.5625, "learning_rate": 0.0001918262792867702, "loss": 0.8449, "step": 13850 }, { "contrastive_loss": 4.043701171875, "epoch": 1.6419679905157083, "mse_loss": 0.10718902200460434, "step": 13850 }, { "epoch": 1.6431535269709543, "grad_norm": 0.470703125, "learning_rate": 0.00019180990326808593, "loss": 0.859, "step": 13860 }, { "contrastive_loss": 3.92138671875, "epoch": 1.6431535269709543, "mse_loss": 0.0660465732216835, "step": 13860 }, { "epoch": 1.6443390634262003, "grad_norm": 0.41796875, "learning_rate": 0.00019179351156160018, "loss": 0.8504, "step": 13870 }, { "contrastive_loss": 3.928466796875, "epoch": 1.6443390634262003, "mse_loss": 0.054838161915540695, "step": 13870 }, { "epoch": 1.6455245998814463, "grad_norm": 0.44140625, "learning_rate": 0.00019177710417011388, "loss": 0.8558, "step": 13880 }, { "contrastive_loss": 3.800048828125, "epoch": 1.6455245998814463, "mse_loss": 0.09777705371379852, "step": 13880 }, { "epoch": 1.6467101363366923, "grad_norm": 0.5234375, "learning_rate": 0.00019176068109643058, "loss": 0.8608, "step": 13890 }, { "contrastive_loss": 4.033935546875, "epoch": 1.6467101363366923, "mse_loss": 0.06676329672336578, "step": 13890 }, { "epoch": 1.6478956727919383, "grad_norm": 0.6484375, "learning_rate": 0.00019174424234335652, "loss": 0.8578, "step": 13900 }, { "contrastive_loss": 3.9844970703125, "epoch": 1.6478956727919383, "mse_loss": 0.07064718753099442, "step": 13900 }, { "epoch": 1.6490812092471843, "grad_norm": 0.45703125, "learning_rate": 0.00019172778791370066, "loss": 0.8413, "step": 13910 }, { "contrastive_loss": 3.992919921875, "epoch": 1.6490812092471843, "mse_loss": 0.05984940752387047, "step": 13910 }, { "epoch": 1.6502667457024303, "grad_norm": 0.466796875, "learning_rate": 0.00019171131781027466, "loss": 0.8581, "step": 13920 }, { "contrastive_loss": 3.851806640625, "epoch": 1.6502667457024303, "mse_loss": 0.06104495748877525, "step": 13920 }, { "epoch": 1.6514522821576763, "grad_norm": 0.52734375, "learning_rate": 0.00019169483203589272, "loss": 0.8556, "step": 13930 }, { "contrastive_loss": 3.89306640625, "epoch": 1.6514522821576763, "mse_loss": 0.06364674866199493, "step": 13930 }, { "epoch": 1.6526378186129222, "grad_norm": 0.50390625, "learning_rate": 0.0001916783305933718, "loss": 0.8554, "step": 13940 }, { "contrastive_loss": 4.01171875, "epoch": 1.6526378186129222, "mse_loss": 0.09701184183359146, "step": 13940 }, { "epoch": 1.6538233550681682, "grad_norm": 0.396484375, "learning_rate": 0.00019166181348553166, "loss": 0.8622, "step": 13950 }, { "contrastive_loss": 3.7962646484375, "epoch": 1.6538233550681682, "mse_loss": 0.06022895127534866, "step": 13950 }, { "epoch": 1.6550088915234142, "grad_norm": 0.462890625, "learning_rate": 0.00019164528071519452, "loss": 0.8433, "step": 13960 }, { "contrastive_loss": 3.8699951171875, "epoch": 1.6550088915234142, "mse_loss": 0.060904767364263535, "step": 13960 }, { "epoch": 1.6561944279786602, "grad_norm": 0.59765625, "learning_rate": 0.0001916287322851854, "loss": 0.8372, "step": 13970 }, { "contrastive_loss": 3.851806640625, "epoch": 1.6561944279786602, "mse_loss": 0.08179887384176254, "step": 13970 }, { "epoch": 1.6573799644339062, "grad_norm": 0.408203125, "learning_rate": 0.00019161216819833202, "loss": 0.8483, "step": 13980 }, { "contrastive_loss": 3.9366455078125, "epoch": 1.6573799644339062, "mse_loss": 0.08299632370471954, "step": 13980 }, { "epoch": 1.6585655008891522, "grad_norm": 0.4296875, "learning_rate": 0.00019159558845746467, "loss": 0.8587, "step": 13990 }, { "contrastive_loss": 3.967529296875, "epoch": 1.6585655008891522, "mse_loss": 0.049431659281253815, "step": 13990 }, { "epoch": 1.6597510373443982, "grad_norm": 0.482421875, "learning_rate": 0.00019157899306541639, "loss": 0.8401, "step": 14000 }, { "contrastive_loss": 3.9368896484375, "epoch": 1.6597510373443982, "mse_loss": 0.03789582476019859, "step": 14000 }, { "epoch": 1.6609365737996442, "grad_norm": 0.5703125, "learning_rate": 0.00019156238202502288, "loss": 0.8541, "step": 14010 }, { "contrastive_loss": 3.97705078125, "epoch": 1.6609365737996442, "mse_loss": 0.05516493692994118, "step": 14010 }, { "epoch": 1.6621221102548902, "grad_norm": 0.60546875, "learning_rate": 0.00019154575533912254, "loss": 0.865, "step": 14020 }, { "contrastive_loss": 3.892578125, "epoch": 1.6621221102548902, "mse_loss": 0.07224959880113602, "step": 14020 }, { "epoch": 1.6633076467101362, "grad_norm": 0.490234375, "learning_rate": 0.0001915291130105564, "loss": 0.8553, "step": 14030 }, { "contrastive_loss": 3.7947998046875, "epoch": 1.6633076467101362, "mse_loss": 0.08177696913480759, "step": 14030 }, { "epoch": 1.6644931831653822, "grad_norm": 0.435546875, "learning_rate": 0.00019151245504216814, "loss": 0.8423, "step": 14040 }, { "contrastive_loss": 3.9822998046875, "epoch": 1.6644931831653822, "mse_loss": 0.06199202686548233, "step": 14040 }, { "epoch": 1.6656787196206282, "grad_norm": 0.44140625, "learning_rate": 0.0001914957814368042, "loss": 0.8502, "step": 14050 }, { "contrastive_loss": 3.8514404296875, "epoch": 1.6656787196206282, "mse_loss": 0.06862123310565948, "step": 14050 }, { "epoch": 1.6668642560758742, "grad_norm": 0.51953125, "learning_rate": 0.00019147909219731363, "loss": 0.8511, "step": 14060 }, { "contrastive_loss": 3.9000244140625, "epoch": 1.6668642560758742, "mse_loss": 0.05599146708846092, "step": 14060 }, { "epoch": 1.6680497925311202, "grad_norm": 0.578125, "learning_rate": 0.00019146238732654816, "loss": 0.8555, "step": 14070 }, { "contrastive_loss": 3.879638671875, "epoch": 1.6680497925311202, "mse_loss": 0.0989062637090683, "step": 14070 }, { "epoch": 1.6692353289863662, "grad_norm": 0.466796875, "learning_rate": 0.0001914456668273622, "loss": 0.8492, "step": 14080 }, { "contrastive_loss": 3.8974609375, "epoch": 1.6692353289863662, "mse_loss": 0.04407254979014397, "step": 14080 }, { "epoch": 1.6704208654416122, "grad_norm": 0.45703125, "learning_rate": 0.00019142893070261282, "loss": 0.8492, "step": 14090 }, { "contrastive_loss": 3.8809814453125, "epoch": 1.6704208654416122, "mse_loss": 0.0635911300778389, "step": 14090 }, { "epoch": 1.6716064018968582, "grad_norm": 0.51171875, "learning_rate": 0.00019141217895515976, "loss": 0.8577, "step": 14100 }, { "contrastive_loss": 3.9801025390625, "epoch": 1.6716064018968582, "mse_loss": 0.05430155247449875, "step": 14100 }, { "epoch": 1.6727919383521044, "grad_norm": 0.42578125, "learning_rate": 0.00019139541158786548, "loss": 0.8427, "step": 14110 }, { "contrastive_loss": 3.8817138671875, "epoch": 1.6727919383521044, "mse_loss": 0.04576433077454567, "step": 14110 }, { "epoch": 1.6739774748073504, "grad_norm": 0.5, "learning_rate": 0.000191378628603595, "loss": 0.8487, "step": 14120 }, { "contrastive_loss": 3.830078125, "epoch": 1.6739774748073504, "mse_loss": 0.06519533693790436, "step": 14120 }, { "epoch": 1.6751630112625964, "grad_norm": 0.58984375, "learning_rate": 0.00019136183000521611, "loss": 0.84, "step": 14130 }, { "contrastive_loss": 3.9481201171875, "epoch": 1.6751630112625964, "mse_loss": 0.053990889340639114, "step": 14130 }, { "epoch": 1.6763485477178424, "grad_norm": 0.58203125, "learning_rate": 0.00019134501579559922, "loss": 0.8515, "step": 14140 }, { "contrastive_loss": 3.8936767578125, "epoch": 1.6763485477178424, "mse_loss": 0.05947575345635414, "step": 14140 }, { "epoch": 1.6775340841730884, "grad_norm": 0.447265625, "learning_rate": 0.00019132818597761744, "loss": 0.85, "step": 14150 }, { "contrastive_loss": 3.841064453125, "epoch": 1.6775340841730884, "mse_loss": 0.06887777149677277, "step": 14150 }, { "epoch": 1.6787196206283344, "grad_norm": 0.458984375, "learning_rate": 0.0001913113405541465, "loss": 0.844, "step": 14160 }, { "contrastive_loss": 3.93896484375, "epoch": 1.6787196206283344, "mse_loss": 0.07047151774168015, "step": 14160 }, { "epoch": 1.6799051570835803, "grad_norm": 0.35546875, "learning_rate": 0.0001912944795280648, "loss": 0.8554, "step": 14170 }, { "contrastive_loss": 3.98583984375, "epoch": 1.6799051570835803, "mse_loss": 0.05508458614349365, "step": 14170 }, { "epoch": 1.6810906935388263, "grad_norm": 0.58984375, "learning_rate": 0.0001912776029022535, "loss": 0.8569, "step": 14180 }, { "contrastive_loss": 3.9920654296875, "epoch": 1.6810906935388263, "mse_loss": 0.04984433576464653, "step": 14180 }, { "epoch": 1.6822762299940723, "grad_norm": 0.546875, "learning_rate": 0.0001912607106795963, "loss": 0.8487, "step": 14190 }, { "contrastive_loss": 4.0806884765625, "epoch": 1.6822762299940723, "mse_loss": 0.0708041861653328, "step": 14190 }, { "epoch": 1.6834617664493183, "grad_norm": 0.4140625, "learning_rate": 0.00019124380286297962, "loss": 0.8506, "step": 14200 }, { "contrastive_loss": 3.9193115234375, "epoch": 1.6834617664493183, "mse_loss": 0.09510374814271927, "step": 14200 }, { "epoch": 1.6846473029045643, "grad_norm": 0.474609375, "learning_rate": 0.00019122687945529254, "loss": 0.851, "step": 14210 }, { "contrastive_loss": 3.966552734375, "epoch": 1.6846473029045643, "mse_loss": 0.07777656614780426, "step": 14210 }, { "epoch": 1.6858328393598103, "grad_norm": 0.5546875, "learning_rate": 0.00019120994045942685, "loss": 0.8611, "step": 14220 }, { "contrastive_loss": 4.0279541015625, "epoch": 1.6858328393598103, "mse_loss": 0.07830112427473068, "step": 14220 }, { "epoch": 1.6870183758150563, "grad_norm": 0.427734375, "learning_rate": 0.00019119298587827693, "loss": 0.8523, "step": 14230 }, { "contrastive_loss": 3.91748046875, "epoch": 1.6870183758150563, "mse_loss": 0.0754893347620964, "step": 14230 }, { "epoch": 1.6882039122703023, "grad_norm": 0.412109375, "learning_rate": 0.00019117601571473985, "loss": 0.8482, "step": 14240 }, { "contrastive_loss": 3.8985595703125, "epoch": 1.6882039122703023, "mse_loss": 0.07894109934568405, "step": 14240 }, { "epoch": 1.6893894487255483, "grad_norm": 0.474609375, "learning_rate": 0.00019115902997171534, "loss": 0.8548, "step": 14250 }, { "contrastive_loss": 3.8023681640625, "epoch": 1.6893894487255483, "mse_loss": 0.08197259902954102, "step": 14250 }, { "epoch": 1.6905749851807943, "grad_norm": 0.51171875, "learning_rate": 0.00019114202865210586, "loss": 0.8514, "step": 14260 }, { "contrastive_loss": 3.892333984375, "epoch": 1.6905749851807943, "mse_loss": 0.10331149399280548, "step": 14260 }, { "epoch": 1.6917605216360403, "grad_norm": 0.466796875, "learning_rate": 0.00019112501175881636, "loss": 0.8423, "step": 14270 }, { "contrastive_loss": 4.0291748046875, "epoch": 1.6917605216360403, "mse_loss": 0.06560202687978745, "step": 14270 }, { "epoch": 1.6929460580912863, "grad_norm": 0.43359375, "learning_rate": 0.00019110797929475468, "loss": 0.8569, "step": 14280 }, { "contrastive_loss": 3.866943359375, "epoch": 1.6929460580912863, "mse_loss": 0.046642277389764786, "step": 14280 }, { "epoch": 1.6941315945465323, "grad_norm": 0.4296875, "learning_rate": 0.0001910909312628311, "loss": 0.8448, "step": 14290 }, { "contrastive_loss": 3.9287109375, "epoch": 1.6941315945465323, "mse_loss": 0.07592425495386124, "step": 14290 }, { "epoch": 1.6953171310017783, "grad_norm": 0.43359375, "learning_rate": 0.00019107386766595874, "loss": 0.8553, "step": 14300 }, { "contrastive_loss": 3.8939208984375, "epoch": 1.6953171310017783, "mse_loss": 0.05716237798333168, "step": 14300 }, { "epoch": 1.6965026674570243, "grad_norm": 0.404296875, "learning_rate": 0.00019105678850705327, "loss": 0.8401, "step": 14310 }, { "contrastive_loss": 3.77490234375, "epoch": 1.6965026674570243, "mse_loss": 0.062194645404815674, "step": 14310 }, { "epoch": 1.6976882039122703, "grad_norm": 0.51171875, "learning_rate": 0.00019103969378903303, "loss": 0.8588, "step": 14320 }, { "contrastive_loss": 3.8026123046875, "epoch": 1.6976882039122703, "mse_loss": 0.07476552575826645, "step": 14320 }, { "epoch": 1.6988737403675163, "grad_norm": 0.5, "learning_rate": 0.00019102258351481907, "loss": 0.8507, "step": 14330 }, { "contrastive_loss": 3.8948974609375, "epoch": 1.6988737403675163, "mse_loss": 0.07153185456991196, "step": 14330 }, { "epoch": 1.7000592768227623, "grad_norm": 0.5234375, "learning_rate": 0.00019100545768733509, "loss": 0.8561, "step": 14340 }, { "contrastive_loss": 4.053466796875, "epoch": 1.7000592768227623, "mse_loss": 0.06124896556138992, "step": 14340 }, { "epoch": 1.7012448132780082, "grad_norm": 0.44140625, "learning_rate": 0.00019098831630950738, "loss": 0.8537, "step": 14350 }, { "contrastive_loss": 3.8363037109375, "epoch": 1.7012448132780082, "mse_loss": 0.06162666901946068, "step": 14350 }, { "epoch": 1.7024303497332542, "grad_norm": 0.447265625, "learning_rate": 0.00019097115938426494, "loss": 0.8459, "step": 14360 }, { "contrastive_loss": 3.8465576171875, "epoch": 1.7024303497332542, "mse_loss": 0.055699028074741364, "step": 14360 }, { "epoch": 1.7036158861885005, "grad_norm": 0.41796875, "learning_rate": 0.00019095398691453943, "loss": 0.852, "step": 14370 }, { "contrastive_loss": 3.9708251953125, "epoch": 1.7036158861885005, "mse_loss": 0.057079143822193146, "step": 14370 }, { "epoch": 1.7048014226437465, "grad_norm": 0.435546875, "learning_rate": 0.00019093679890326513, "loss": 0.8491, "step": 14380 }, { "contrastive_loss": 4.010009765625, "epoch": 1.7048014226437465, "mse_loss": 0.06471068412065506, "step": 14380 }, { "epoch": 1.7059869590989925, "grad_norm": 0.423828125, "learning_rate": 0.00019091959535337907, "loss": 0.8579, "step": 14390 }, { "contrastive_loss": 3.92578125, "epoch": 1.7059869590989925, "mse_loss": 0.07942307740449905, "step": 14390 }, { "epoch": 1.7071724955542384, "grad_norm": 0.423828125, "learning_rate": 0.0001909023762678208, "loss": 0.8618, "step": 14400 }, { "contrastive_loss": 3.9122314453125, "epoch": 1.7071724955542384, "mse_loss": 0.06638967245817184, "step": 14400 }, { "epoch": 1.7083580320094844, "grad_norm": 0.5546875, "learning_rate": 0.0001908851416495326, "loss": 0.8433, "step": 14410 }, { "contrastive_loss": 3.84716796875, "epoch": 1.7083580320094844, "mse_loss": 0.07783125340938568, "step": 14410 }, { "epoch": 1.7095435684647304, "grad_norm": 0.35546875, "learning_rate": 0.00019086789150145943, "loss": 0.847, "step": 14420 }, { "contrastive_loss": 3.895263671875, "epoch": 1.7095435684647304, "mse_loss": 0.05417821183800697, "step": 14420 }, { "epoch": 1.7107291049199764, "grad_norm": 0.478515625, "learning_rate": 0.00019085062582654882, "loss": 0.8441, "step": 14430 }, { "contrastive_loss": 3.884521484375, "epoch": 1.7107291049199764, "mse_loss": 0.04733944684267044, "step": 14430 }, { "epoch": 1.7119146413752224, "grad_norm": 0.462890625, "learning_rate": 0.00019083334462775104, "loss": 0.8411, "step": 14440 }, { "contrastive_loss": 3.8492431640625, "epoch": 1.7119146413752224, "mse_loss": 0.06671660393476486, "step": 14440 }, { "epoch": 1.7131001778304684, "grad_norm": 0.50390625, "learning_rate": 0.00019081604790801898, "loss": 0.8504, "step": 14450 }, { "contrastive_loss": 3.92236328125, "epoch": 1.7131001778304684, "mse_loss": 0.06584583967924118, "step": 14450 }, { "epoch": 1.7142857142857144, "grad_norm": 0.369140625, "learning_rate": 0.00019079873567030812, "loss": 0.8449, "step": 14460 }, { "contrastive_loss": 3.874267578125, "epoch": 1.7142857142857144, "mse_loss": 0.057458944618701935, "step": 14460 }, { "epoch": 1.7154712507409604, "grad_norm": 0.49609375, "learning_rate": 0.0001907814079175767, "loss": 0.8562, "step": 14470 }, { "contrastive_loss": 3.888427734375, "epoch": 1.7154712507409604, "mse_loss": 0.07476075738668442, "step": 14470 }, { "epoch": 1.7166567871962064, "grad_norm": 0.49609375, "learning_rate": 0.00019076406465278554, "loss": 0.8485, "step": 14480 }, { "contrastive_loss": 3.92041015625, "epoch": 1.7166567871962064, "mse_loss": 0.07083828002214432, "step": 14480 }, { "epoch": 1.7178423236514524, "grad_norm": 0.68359375, "learning_rate": 0.00019074670587889813, "loss": 0.8462, "step": 14490 }, { "contrastive_loss": 3.875, "epoch": 1.7178423236514524, "mse_loss": 0.05497996136546135, "step": 14490 }, { "epoch": 1.7190278601066984, "grad_norm": 0.4453125, "learning_rate": 0.00019072933159888065, "loss": 0.8433, "step": 14500 }, { "contrastive_loss": 3.9981689453125, "epoch": 1.7190278601066984, "mse_loss": 0.09527669847011566, "step": 14500 }, { "epoch": 1.7202133965619444, "grad_norm": 0.40234375, "learning_rate": 0.00019071194181570183, "loss": 0.8514, "step": 14510 }, { "contrastive_loss": 4.0467529296875, "epoch": 1.7202133965619444, "mse_loss": 0.07071895152330399, "step": 14510 }, { "epoch": 1.7213989330171904, "grad_norm": 0.439453125, "learning_rate": 0.00019069453653233312, "loss": 0.849, "step": 14520 }, { "contrastive_loss": 3.88720703125, "epoch": 1.7213989330171904, "mse_loss": 0.06592447310686111, "step": 14520 }, { "epoch": 1.7225844694724364, "grad_norm": 0.3828125, "learning_rate": 0.0001906771157517486, "loss": 0.8434, "step": 14530 }, { "contrastive_loss": 3.7860107421875, "epoch": 1.7225844694724364, "mse_loss": 0.10043050348758698, "step": 14530 }, { "epoch": 1.7237700059276824, "grad_norm": 0.515625, "learning_rate": 0.00019065967947692503, "loss": 0.8511, "step": 14540 }, { "contrastive_loss": 3.917724609375, "epoch": 1.7237700059276824, "mse_loss": 0.06849000602960587, "step": 14540 }, { "epoch": 1.7249555423829284, "grad_norm": 0.439453125, "learning_rate": 0.0001906422277108418, "loss": 0.8619, "step": 14550 }, { "contrastive_loss": 3.940185546875, "epoch": 1.7249555423829284, "mse_loss": 0.05795273557305336, "step": 14550 }, { "epoch": 1.7261410788381744, "grad_norm": 0.41015625, "learning_rate": 0.00019062476045648093, "loss": 0.8579, "step": 14560 }, { "contrastive_loss": 3.986083984375, "epoch": 1.7261410788381744, "mse_loss": 0.06806298345327377, "step": 14560 }, { "epoch": 1.7273266152934204, "grad_norm": 0.39453125, "learning_rate": 0.0001906072777168271, "loss": 0.851, "step": 14570 }, { "contrastive_loss": 3.8634033203125, "epoch": 1.7273266152934204, "mse_loss": 0.0758732408285141, "step": 14570 }, { "epoch": 1.7285121517486663, "grad_norm": 0.5546875, "learning_rate": 0.0001905897794948676, "loss": 0.8479, "step": 14580 }, { "contrastive_loss": 4.0054931640625, "epoch": 1.7285121517486663, "mse_loss": 0.05523990839719772, "step": 14580 }, { "epoch": 1.7296976882039123, "grad_norm": 0.400390625, "learning_rate": 0.00019057226579359245, "loss": 0.8486, "step": 14590 }, { "contrastive_loss": 3.869873046875, "epoch": 1.7296976882039123, "mse_loss": 0.04850577935576439, "step": 14590 }, { "epoch": 1.7308832246591583, "grad_norm": 0.55859375, "learning_rate": 0.0001905547366159942, "loss": 0.8539, "step": 14600 }, { "contrastive_loss": 3.80810546875, "epoch": 1.7308832246591583, "mse_loss": 0.08619803935289383, "step": 14600 }, { "epoch": 1.7320687611144043, "grad_norm": 0.474609375, "learning_rate": 0.00019053719196506815, "loss": 0.8475, "step": 14610 }, { "contrastive_loss": 4.1270751953125, "epoch": 1.7320687611144043, "mse_loss": 0.07681621611118317, "step": 14610 }, { "epoch": 1.7332542975696503, "grad_norm": 0.474609375, "learning_rate": 0.00019051963184381219, "loss": 0.8617, "step": 14620 }, { "contrastive_loss": 3.9483642578125, "epoch": 1.7332542975696503, "mse_loss": 0.08283615112304688, "step": 14620 }, { "epoch": 1.7344398340248963, "grad_norm": 0.44140625, "learning_rate": 0.00019050205625522685, "loss": 0.86, "step": 14630 }, { "contrastive_loss": 3.8192138671875, "epoch": 1.7344398340248963, "mse_loss": 0.07313638180494308, "step": 14630 }, { "epoch": 1.7356253704801423, "grad_norm": 0.470703125, "learning_rate": 0.00019048446520231535, "loss": 0.8549, "step": 14640 }, { "contrastive_loss": 3.9290771484375, "epoch": 1.7356253704801423, "mse_loss": 0.07378504425287247, "step": 14640 }, { "epoch": 1.7368109069353883, "grad_norm": 0.4296875, "learning_rate": 0.0001904668586880835, "loss": 0.8444, "step": 14650 }, { "contrastive_loss": 3.8753662109375, "epoch": 1.7368109069353883, "mse_loss": 0.04171419143676758, "step": 14650 }, { "epoch": 1.7379964433906343, "grad_norm": 0.4375, "learning_rate": 0.00019044923671553978, "loss": 0.8499, "step": 14660 }, { "contrastive_loss": 3.8289794921875, "epoch": 1.7379964433906343, "mse_loss": 0.07734154909849167, "step": 14660 }, { "epoch": 1.7391819798458803, "grad_norm": 0.54296875, "learning_rate": 0.00019043159928769528, "loss": 0.8559, "step": 14670 }, { "contrastive_loss": 3.99267578125, "epoch": 1.7391819798458803, "mse_loss": 0.057911764830350876, "step": 14670 }, { "epoch": 1.7403675163011263, "grad_norm": 0.427734375, "learning_rate": 0.0001904139464075638, "loss": 0.8532, "step": 14680 }, { "contrastive_loss": 3.92578125, "epoch": 1.7403675163011263, "mse_loss": 0.07063419371843338, "step": 14680 }, { "epoch": 1.7415530527563723, "grad_norm": 0.431640625, "learning_rate": 0.00019039627807816166, "loss": 0.8488, "step": 14690 }, { "contrastive_loss": 3.8084716796875, "epoch": 1.7415530527563723, "mse_loss": 0.07597362250089645, "step": 14690 }, { "epoch": 1.7427385892116183, "grad_norm": 0.490234375, "learning_rate": 0.000190378594302508, "loss": 0.8437, "step": 14700 }, { "contrastive_loss": 4.0162353515625, "epoch": 1.7427385892116183, "mse_loss": 0.0953996330499649, "step": 14700 }, { "epoch": 1.7439241256668643, "grad_norm": 0.474609375, "learning_rate": 0.00019036089508362437, "loss": 0.8664, "step": 14710 }, { "contrastive_loss": 3.9066162109375, "epoch": 1.7439241256668643, "mse_loss": 0.07970988750457764, "step": 14710 }, { "epoch": 1.7451096621221103, "grad_norm": 0.5234375, "learning_rate": 0.0001903431804245352, "loss": 0.8553, "step": 14720 }, { "contrastive_loss": 3.90234375, "epoch": 1.7451096621221103, "mse_loss": 0.09824379533529282, "step": 14720 }, { "epoch": 1.7462951985773563, "grad_norm": 0.51171875, "learning_rate": 0.00019032545032826736, "loss": 0.8523, "step": 14730 }, { "contrastive_loss": 3.9796142578125, "epoch": 1.7462951985773563, "mse_loss": 0.09935346990823746, "step": 14730 }, { "epoch": 1.7474807350326023, "grad_norm": 0.51953125, "learning_rate": 0.0001903077047978505, "loss": 0.8587, "step": 14740 }, { "contrastive_loss": 3.8946533203125, "epoch": 1.7474807350326023, "mse_loss": 0.047646306455135345, "step": 14740 }, { "epoch": 1.7486662714878483, "grad_norm": 0.486328125, "learning_rate": 0.00019028994383631678, "loss": 0.8457, "step": 14750 }, { "contrastive_loss": 3.9129638671875, "epoch": 1.7486662714878483, "mse_loss": 0.07019086182117462, "step": 14750 }, { "epoch": 1.7498518079430943, "grad_norm": 0.48828125, "learning_rate": 0.0001902721674467011, "loss": 0.8467, "step": 14760 }, { "contrastive_loss": 3.9910888671875, "epoch": 1.7498518079430943, "mse_loss": 0.09065079689025879, "step": 14760 }, { "epoch": 1.7510373443983402, "grad_norm": 0.482421875, "learning_rate": 0.0001902543756320409, "loss": 0.8591, "step": 14770 }, { "contrastive_loss": 3.7587890625, "epoch": 1.7510373443983402, "mse_loss": 0.06144343689084053, "step": 14770 }, { "epoch": 1.7522228808535862, "grad_norm": 0.60546875, "learning_rate": 0.00019023656839537646, "loss": 0.8408, "step": 14780 }, { "contrastive_loss": 3.9578857421875, "epoch": 1.7522228808535862, "mse_loss": 0.08994000405073166, "step": 14780 }, { "epoch": 1.7534084173088322, "grad_norm": 0.37109375, "learning_rate": 0.00019021874573975042, "loss": 0.8433, "step": 14790 }, { "contrastive_loss": 3.947021484375, "epoch": 1.7534084173088322, "mse_loss": 0.09081489592790604, "step": 14790 }, { "epoch": 1.7545939537640782, "grad_norm": 0.4453125, "learning_rate": 0.00019020090766820816, "loss": 0.8449, "step": 14800 }, { "contrastive_loss": 3.813720703125, "epoch": 1.7545939537640782, "mse_loss": 0.0422021821141243, "step": 14800 }, { "epoch": 1.7557794902193242, "grad_norm": 0.4140625, "learning_rate": 0.00019018305418379785, "loss": 0.8453, "step": 14810 }, { "contrastive_loss": 4.00634765625, "epoch": 1.7557794902193242, "mse_loss": 0.06850408017635345, "step": 14810 }, { "epoch": 1.7569650266745702, "grad_norm": 0.388671875, "learning_rate": 0.00019016518528957007, "loss": 0.859, "step": 14820 }, { "contrastive_loss": 3.905029296875, "epoch": 1.7569650266745702, "mse_loss": 0.06490639597177505, "step": 14820 }, { "epoch": 1.7581505631298162, "grad_norm": 0.52734375, "learning_rate": 0.00019014730098857819, "loss": 0.8517, "step": 14830 }, { "contrastive_loss": 4.1912841796875, "epoch": 1.7581505631298162, "mse_loss": 0.05730307847261429, "step": 14830 }, { "epoch": 1.7593360995850622, "grad_norm": 0.427734375, "learning_rate": 0.00019012940128387804, "loss": 0.8472, "step": 14840 }, { "contrastive_loss": 3.8482666015625, "epoch": 1.7593360995850622, "mse_loss": 0.06615209579467773, "step": 14840 }, { "epoch": 1.7605216360403082, "grad_norm": 0.5390625, "learning_rate": 0.00019011148617852829, "loss": 0.8508, "step": 14850 }, { "contrastive_loss": 3.908447265625, "epoch": 1.7605216360403082, "mse_loss": 0.09070729464292526, "step": 14850 }, { "epoch": 1.7617071724955542, "grad_norm": 0.48046875, "learning_rate": 0.0001900935556755901, "loss": 0.8489, "step": 14860 }, { "contrastive_loss": 3.933837890625, "epoch": 1.7617071724955542, "mse_loss": 0.07652665674686432, "step": 14860 }, { "epoch": 1.7628927089508002, "grad_norm": 0.466796875, "learning_rate": 0.0001900756097781273, "loss": 0.8436, "step": 14870 }, { "contrastive_loss": 3.833740234375, "epoch": 1.7628927089508002, "mse_loss": 0.05766530707478523, "step": 14870 }, { "epoch": 1.7640782454060462, "grad_norm": 0.4765625, "learning_rate": 0.00019005764848920639, "loss": 0.8548, "step": 14880 }, { "contrastive_loss": 3.8468017578125, "epoch": 1.7640782454060462, "mse_loss": 0.06025577709078789, "step": 14880 }, { "epoch": 1.7652637818612922, "grad_norm": 0.40234375, "learning_rate": 0.00019003967181189642, "loss": 0.8465, "step": 14890 }, { "contrastive_loss": 4.063232421875, "epoch": 1.7652637818612922, "mse_loss": 0.07484577596187592, "step": 14890 }, { "epoch": 1.7664493183165382, "grad_norm": 0.392578125, "learning_rate": 0.0001900216797492691, "loss": 0.8479, "step": 14900 }, { "contrastive_loss": 3.879150390625, "epoch": 1.7664493183165382, "mse_loss": 0.048637039959430695, "step": 14900 }, { "epoch": 1.7676348547717842, "grad_norm": 0.44921875, "learning_rate": 0.00019000367230439884, "loss": 0.8492, "step": 14910 }, { "contrastive_loss": 4.0244140625, "epoch": 1.7676348547717842, "mse_loss": 0.05747099593281746, "step": 14910 }, { "epoch": 1.7688203912270302, "grad_norm": 0.484375, "learning_rate": 0.0001899856494803626, "loss": 0.8612, "step": 14920 }, { "contrastive_loss": 3.8101806640625, "epoch": 1.7688203912270302, "mse_loss": 0.043078966438770294, "step": 14920 }, { "epoch": 1.7700059276822762, "grad_norm": 0.427734375, "learning_rate": 0.00018996761128023995, "loss": 0.8409, "step": 14930 }, { "contrastive_loss": 4.0010986328125, "epoch": 1.7700059276822762, "mse_loss": 0.06357394903898239, "step": 14930 }, { "epoch": 1.7711914641375222, "grad_norm": 0.453125, "learning_rate": 0.00018994955770711312, "loss": 0.8561, "step": 14940 }, { "contrastive_loss": 3.8572998046875, "epoch": 1.7711914641375222, "mse_loss": 0.08413626253604889, "step": 14940 }, { "epoch": 1.7723770005927681, "grad_norm": 0.45703125, "learning_rate": 0.00018993148876406707, "loss": 0.8597, "step": 14950 }, { "contrastive_loss": 3.900390625, "epoch": 1.7723770005927681, "mse_loss": 0.054650742560625076, "step": 14950 }, { "epoch": 1.7735625370480141, "grad_norm": 0.40234375, "learning_rate": 0.00018991340445418918, "loss": 0.849, "step": 14960 }, { "contrastive_loss": 3.7476806640625, "epoch": 1.7735625370480141, "mse_loss": 0.05198974534869194, "step": 14960 }, { "epoch": 1.7747480735032601, "grad_norm": 0.4296875, "learning_rate": 0.00018989530478056966, "loss": 0.8397, "step": 14970 }, { "contrastive_loss": 3.90625, "epoch": 1.7747480735032601, "mse_loss": 0.0666404590010643, "step": 14970 }, { "epoch": 1.7759336099585061, "grad_norm": 0.47265625, "learning_rate": 0.00018987718974630113, "loss": 0.8609, "step": 14980 }, { "contrastive_loss": 4.0101318359375, "epoch": 1.7759336099585061, "mse_loss": 0.05688715726137161, "step": 14980 }, { "epoch": 1.7771191464137521, "grad_norm": 0.423828125, "learning_rate": 0.00018985905935447905, "loss": 0.8574, "step": 14990 }, { "contrastive_loss": 4.06640625, "epoch": 1.7771191464137521, "mse_loss": 0.07430296391248703, "step": 14990 }, { "epoch": 1.7783046828689981, "grad_norm": 0.333984375, "learning_rate": 0.00018984091360820136, "loss": 0.8569, "step": 15000 }, { "contrastive_loss": 3.8106689453125, "epoch": 1.7783046828689981, "mse_loss": 0.10397563874721527, "step": 15000 }, { "epoch": 1.7794902193242441, "grad_norm": 0.349609375, "learning_rate": 0.00018982275251056872, "loss": 0.8489, "step": 15010 }, { "contrastive_loss": 3.817626953125, "epoch": 1.7794902193242441, "mse_loss": 0.08744395524263382, "step": 15010 }, { "epoch": 1.78067575577949, "grad_norm": 0.45703125, "learning_rate": 0.0001898045760646843, "loss": 0.8468, "step": 15020 }, { "contrastive_loss": 3.9140625, "epoch": 1.78067575577949, "mse_loss": 0.06391312927007675, "step": 15020 }, { "epoch": 1.781861292234736, "grad_norm": 0.427734375, "learning_rate": 0.00018978638427365402, "loss": 0.8492, "step": 15030 }, { "contrastive_loss": 3.968017578125, "epoch": 1.781861292234736, "mse_loss": 0.04915054515004158, "step": 15030 }, { "epoch": 1.783046828689982, "grad_norm": 0.3828125, "learning_rate": 0.00018976817714058631, "loss": 0.8444, "step": 15040 }, { "contrastive_loss": 3.9705810546875, "epoch": 1.783046828689982, "mse_loss": 0.08618758618831635, "step": 15040 }, { "epoch": 1.784232365145228, "grad_norm": 0.43359375, "learning_rate": 0.00018974995466859232, "loss": 0.8503, "step": 15050 }, { "contrastive_loss": 3.9149169921875, "epoch": 1.784232365145228, "mse_loss": 0.053402166813611984, "step": 15050 }, { "epoch": 1.785417901600474, "grad_norm": 0.44921875, "learning_rate": 0.00018973171686078571, "loss": 0.8451, "step": 15060 }, { "contrastive_loss": 4.0606689453125, "epoch": 1.785417901600474, "mse_loss": 0.0726701095700264, "step": 15060 }, { "epoch": 1.78660343805572, "grad_norm": 0.44921875, "learning_rate": 0.00018971346372028287, "loss": 0.8452, "step": 15070 }, { "contrastive_loss": 3.822509765625, "epoch": 1.78660343805572, "mse_loss": 0.07857110351324081, "step": 15070 }, { "epoch": 1.787788974510966, "grad_norm": 0.5, "learning_rate": 0.00018969519525020273, "loss": 0.8404, "step": 15080 }, { "contrastive_loss": 3.958984375, "epoch": 1.787788974510966, "mse_loss": 0.0737016424536705, "step": 15080 }, { "epoch": 1.788974510966212, "grad_norm": 0.474609375, "learning_rate": 0.0001896769114536669, "loss": 0.8529, "step": 15090 }, { "contrastive_loss": 3.915771484375, "epoch": 1.788974510966212, "mse_loss": 0.05362662672996521, "step": 15090 }, { "epoch": 1.790160047421458, "grad_norm": 0.5, "learning_rate": 0.0001896586123337996, "loss": 0.8519, "step": 15100 }, { "contrastive_loss": 3.9537353515625, "epoch": 1.790160047421458, "mse_loss": 0.058111660182476044, "step": 15100 }, { "epoch": 1.791345583876704, "grad_norm": 0.50390625, "learning_rate": 0.0001896402978937276, "loss": 0.8517, "step": 15110 }, { "contrastive_loss": 3.845458984375, "epoch": 1.791345583876704, "mse_loss": 0.1277415007352829, "step": 15110 }, { "epoch": 1.79253112033195, "grad_norm": 0.50390625, "learning_rate": 0.00018962196813658032, "loss": 0.8511, "step": 15120 }, { "contrastive_loss": 4.0159912109375, "epoch": 1.79253112033195, "mse_loss": 0.06329239159822464, "step": 15120 }, { "epoch": 1.793716656787196, "grad_norm": 0.39453125, "learning_rate": 0.0001896036230654899, "loss": 0.8532, "step": 15130 }, { "contrastive_loss": 3.955322265625, "epoch": 1.793716656787196, "mse_loss": 0.05757637694478035, "step": 15130 }, { "epoch": 1.794902193242442, "grad_norm": 0.578125, "learning_rate": 0.00018958526268359095, "loss": 0.8471, "step": 15140 }, { "contrastive_loss": 4.0206298828125, "epoch": 1.794902193242442, "mse_loss": 0.06454608589410782, "step": 15140 }, { "epoch": 1.796087729697688, "grad_norm": 0.43359375, "learning_rate": 0.00018956688699402077, "loss": 0.8487, "step": 15150 }, { "contrastive_loss": 3.9556884765625, "epoch": 1.796087729697688, "mse_loss": 0.0627535954117775, "step": 15150 }, { "epoch": 1.7972732661529343, "grad_norm": 0.455078125, "learning_rate": 0.00018954849599991927, "loss": 0.8516, "step": 15160 }, { "contrastive_loss": 3.87646484375, "epoch": 1.7972732661529343, "mse_loss": 0.05173375830054283, "step": 15160 }, { "epoch": 1.7984588026081803, "grad_norm": 0.37890625, "learning_rate": 0.00018953008970442895, "loss": 0.8437, "step": 15170 }, { "contrastive_loss": 3.9283447265625, "epoch": 1.7984588026081803, "mse_loss": 0.06598860770463943, "step": 15170 }, { "epoch": 1.7996443390634262, "grad_norm": 0.43359375, "learning_rate": 0.00018951166811069495, "loss": 0.8341, "step": 15180 }, { "contrastive_loss": 3.9039306640625, "epoch": 1.7996443390634262, "mse_loss": 0.06142723560333252, "step": 15180 }, { "epoch": 1.8008298755186722, "grad_norm": 0.470703125, "learning_rate": 0.00018949323122186503, "loss": 0.8515, "step": 15190 }, { "contrastive_loss": 3.952880859375, "epoch": 1.8008298755186722, "mse_loss": 0.0418257936835289, "step": 15190 }, { "epoch": 1.8020154119739182, "grad_norm": 0.49609375, "learning_rate": 0.00018947477904108955, "loss": 0.8568, "step": 15200 }, { "contrastive_loss": 3.9183349609375, "epoch": 1.8020154119739182, "mse_loss": 0.0863218829035759, "step": 15200 }, { "epoch": 1.8032009484291642, "grad_norm": 0.44140625, "learning_rate": 0.00018945631157152147, "loss": 0.8508, "step": 15210 }, { "contrastive_loss": 3.899169921875, "epoch": 1.8032009484291642, "mse_loss": 0.06890656054019928, "step": 15210 }, { "epoch": 1.8043864848844102, "grad_norm": 0.390625, "learning_rate": 0.00018943782881631634, "loss": 0.8518, "step": 15220 }, { "contrastive_loss": 3.9033203125, "epoch": 1.8043864848844102, "mse_loss": 0.062360554933547974, "step": 15220 }, { "epoch": 1.8055720213396562, "grad_norm": 0.419921875, "learning_rate": 0.00018941933077863243, "loss": 0.8463, "step": 15230 }, { "contrastive_loss": 3.8692626953125, "epoch": 1.8055720213396562, "mse_loss": 0.08881885558366776, "step": 15230 }, { "epoch": 1.8067575577949022, "grad_norm": 0.515625, "learning_rate": 0.0001894008174616305, "loss": 0.8608, "step": 15240 }, { "contrastive_loss": 3.8701171875, "epoch": 1.8067575577949022, "mse_loss": 0.08693311363458633, "step": 15240 }, { "epoch": 1.8079430942501482, "grad_norm": 0.4453125, "learning_rate": 0.00018938228886847397, "loss": 0.853, "step": 15250 }, { "contrastive_loss": 3.941162109375, "epoch": 1.8079430942501482, "mse_loss": 0.0807383731007576, "step": 15250 }, { "epoch": 1.8091286307053942, "grad_norm": 0.490234375, "learning_rate": 0.0001893637450023289, "loss": 0.8595, "step": 15260 }, { "contrastive_loss": 3.9676513671875, "epoch": 1.8091286307053942, "mse_loss": 0.06930112838745117, "step": 15260 }, { "epoch": 1.8103141671606402, "grad_norm": 0.41796875, "learning_rate": 0.00018934518586636394, "loss": 0.8509, "step": 15270 }, { "contrastive_loss": 3.939208984375, "epoch": 1.8103141671606402, "mse_loss": 0.08392124623060226, "step": 15270 }, { "epoch": 1.8114997036158862, "grad_norm": 0.515625, "learning_rate": 0.0001893266114637503, "loss": 0.8563, "step": 15280 }, { "contrastive_loss": 3.8990478515625, "epoch": 1.8114997036158862, "mse_loss": 0.0563315823674202, "step": 15280 }, { "epoch": 1.8126852400711322, "grad_norm": 0.384765625, "learning_rate": 0.0001893080217976618, "loss": 0.8444, "step": 15290 }, { "contrastive_loss": 3.8514404296875, "epoch": 1.8126852400711322, "mse_loss": 0.09536627680063248, "step": 15290 }, { "epoch": 1.8138707765263782, "grad_norm": 0.375, "learning_rate": 0.000189289416871275, "loss": 0.8433, "step": 15300 }, { "contrastive_loss": 3.90185546875, "epoch": 1.8138707765263782, "mse_loss": 0.07989440858364105, "step": 15300 }, { "epoch": 1.8150563129816242, "grad_norm": 0.4375, "learning_rate": 0.00018927079668776893, "loss": 0.8506, "step": 15310 }, { "contrastive_loss": 3.853271484375, "epoch": 1.8150563129816242, "mse_loss": 0.0650465115904808, "step": 15310 }, { "epoch": 1.8162418494368702, "grad_norm": 0.46875, "learning_rate": 0.00018925216125032526, "loss": 0.8514, "step": 15320 }, { "contrastive_loss": 3.867919921875, "epoch": 1.8162418494368702, "mse_loss": 0.054711371660232544, "step": 15320 }, { "epoch": 1.8174273858921162, "grad_norm": 0.796875, "learning_rate": 0.00018923351056212827, "loss": 0.846, "step": 15330 }, { "contrastive_loss": 3.9141845703125, "epoch": 1.8174273858921162, "mse_loss": 0.10961867868900299, "step": 15330 }, { "epoch": 1.8186129223473622, "grad_norm": 0.4296875, "learning_rate": 0.00018921484462636488, "loss": 0.8516, "step": 15340 }, { "contrastive_loss": 3.8575439453125, "epoch": 1.8186129223473622, "mse_loss": 0.06225809454917908, "step": 15340 }, { "epoch": 1.8197984588026082, "grad_norm": 0.41796875, "learning_rate": 0.00018919616344622458, "loss": 0.8445, "step": 15350 }, { "contrastive_loss": 3.801025390625, "epoch": 1.8197984588026082, "mse_loss": 0.06075737252831459, "step": 15350 }, { "epoch": 1.8209839952578541, "grad_norm": 0.515625, "learning_rate": 0.00018917746702489945, "loss": 0.8464, "step": 15360 }, { "contrastive_loss": 3.827880859375, "epoch": 1.8209839952578541, "mse_loss": 0.05839257687330246, "step": 15360 }, { "epoch": 1.8221695317131001, "grad_norm": 0.427734375, "learning_rate": 0.00018915875536558422, "loss": 0.8513, "step": 15370 }, { "contrastive_loss": 4.1505126953125, "epoch": 1.8221695317131001, "mse_loss": 0.06705641001462936, "step": 15370 }, { "epoch": 1.8233550681683461, "grad_norm": 0.392578125, "learning_rate": 0.0001891400284714762, "loss": 0.8539, "step": 15380 }, { "contrastive_loss": 3.826904296875, "epoch": 1.8233550681683461, "mse_loss": 0.04954742640256882, "step": 15380 }, { "epoch": 1.8245406046235921, "grad_norm": 0.484375, "learning_rate": 0.0001891212863457753, "loss": 0.8471, "step": 15390 }, { "contrastive_loss": 3.8421630859375, "epoch": 1.8245406046235921, "mse_loss": 0.0733788013458252, "step": 15390 }, { "epoch": 1.8257261410788381, "grad_norm": 0.435546875, "learning_rate": 0.00018910252899168403, "loss": 0.8675, "step": 15400 }, { "contrastive_loss": 3.8984375, "epoch": 1.8257261410788381, "mse_loss": 0.09047220647335052, "step": 15400 }, { "epoch": 1.8269116775340841, "grad_norm": 0.408203125, "learning_rate": 0.0001890837564124075, "loss": 0.841, "step": 15410 }, { "contrastive_loss": 3.9976806640625, "epoch": 1.8269116775340841, "mse_loss": 0.08400680869817734, "step": 15410 }, { "epoch": 1.8280972139893301, "grad_norm": 0.47265625, "learning_rate": 0.00018906496861115346, "loss": 0.8545, "step": 15420 }, { "contrastive_loss": 3.822998046875, "epoch": 1.8280972139893301, "mse_loss": 0.051121924072504044, "step": 15420 }, { "epoch": 1.8292827504445763, "grad_norm": 0.369140625, "learning_rate": 0.00018904616559113223, "loss": 0.8439, "step": 15430 }, { "contrastive_loss": 3.8779296875, "epoch": 1.8292827504445763, "mse_loss": 0.07309368997812271, "step": 15430 }, { "epoch": 1.8304682868998223, "grad_norm": 0.3984375, "learning_rate": 0.0001890273473555567, "loss": 0.8523, "step": 15440 }, { "contrastive_loss": 3.971923828125, "epoch": 1.8304682868998223, "mse_loss": 0.08889289200305939, "step": 15440 }, { "epoch": 1.8316538233550683, "grad_norm": 0.423828125, "learning_rate": 0.00018900851390764244, "loss": 0.8641, "step": 15450 }, { "contrastive_loss": 3.9505615234375, "epoch": 1.8316538233550683, "mse_loss": 0.05445437878370285, "step": 15450 }, { "epoch": 1.8328393598103143, "grad_norm": 0.392578125, "learning_rate": 0.0001889896652506075, "loss": 0.8448, "step": 15460 }, { "contrastive_loss": 3.8934326171875, "epoch": 1.8328393598103143, "mse_loss": 0.06941484659910202, "step": 15460 }, { "epoch": 1.8340248962655603, "grad_norm": 0.41015625, "learning_rate": 0.00018897080138767267, "loss": 0.8538, "step": 15470 }, { "contrastive_loss": 3.900634765625, "epoch": 1.8340248962655603, "mse_loss": 0.08289007097482681, "step": 15470 }, { "epoch": 1.8352104327208063, "grad_norm": 0.41796875, "learning_rate": 0.00018895192232206123, "loss": 0.8438, "step": 15480 }, { "contrastive_loss": 3.8193359375, "epoch": 1.8352104327208063, "mse_loss": 0.07024415582418442, "step": 15480 }, { "epoch": 1.8363959691760523, "grad_norm": 0.57421875, "learning_rate": 0.0001889330280569991, "loss": 0.8426, "step": 15490 }, { "contrastive_loss": 3.902587890625, "epoch": 1.8363959691760523, "mse_loss": 0.08684486895799637, "step": 15490 }, { "epoch": 1.8375815056312983, "grad_norm": 0.41796875, "learning_rate": 0.0001889141185957148, "loss": 0.8512, "step": 15500 }, { "contrastive_loss": 3.9625244140625, "epoch": 1.8375815056312983, "mse_loss": 0.058643363416194916, "step": 15500 }, { "epoch": 1.8387670420865443, "grad_norm": 0.42578125, "learning_rate": 0.00018889519394143945, "loss": 0.8442, "step": 15510 }, { "contrastive_loss": 3.8927001953125, "epoch": 1.8387670420865443, "mse_loss": 0.06161708012223244, "step": 15510 }, { "epoch": 1.8399525785417903, "grad_norm": 0.373046875, "learning_rate": 0.00018887625409740673, "loss": 0.8385, "step": 15520 }, { "contrastive_loss": 3.9022216796875, "epoch": 1.8399525785417903, "mse_loss": 0.0732872486114502, "step": 15520 }, { "epoch": 1.8411381149970363, "grad_norm": 0.50390625, "learning_rate": 0.00018885729906685297, "loss": 0.8487, "step": 15530 }, { "contrastive_loss": 3.843505859375, "epoch": 1.8411381149970363, "mse_loss": 0.08340024948120117, "step": 15530 }, { "epoch": 1.8423236514522823, "grad_norm": 0.51953125, "learning_rate": 0.00018883832885301704, "loss": 0.8467, "step": 15540 }, { "contrastive_loss": 4.067138671875, "epoch": 1.8423236514522823, "mse_loss": 0.05543488264083862, "step": 15540 }, { "epoch": 1.8435091879075283, "grad_norm": 0.435546875, "learning_rate": 0.00018881934345914045, "loss": 0.8452, "step": 15550 }, { "contrastive_loss": 3.777099609375, "epoch": 1.8435091879075283, "mse_loss": 0.08594127744436264, "step": 15550 }, { "epoch": 1.8446947243627743, "grad_norm": 0.5, "learning_rate": 0.00018880034288846728, "loss": 0.8526, "step": 15560 }, { "contrastive_loss": 3.8931884765625, "epoch": 1.8446947243627743, "mse_loss": 0.0746268555521965, "step": 15560 }, { "epoch": 1.8458802608180203, "grad_norm": 0.3828125, "learning_rate": 0.00018878132714424418, "loss": 0.853, "step": 15570 }, { "contrastive_loss": 3.9779052734375, "epoch": 1.8458802608180203, "mse_loss": 0.07142063230276108, "step": 15570 }, { "epoch": 1.8470657972732663, "grad_norm": 0.3984375, "learning_rate": 0.00018876229622972045, "loss": 0.8517, "step": 15580 }, { "contrastive_loss": 4.08984375, "epoch": 1.8470657972732663, "mse_loss": 0.08433490246534348, "step": 15580 }, { "epoch": 1.8482513337285122, "grad_norm": 0.412109375, "learning_rate": 0.000188743250148148, "loss": 0.8504, "step": 15590 }, { "contrastive_loss": 4.0509033203125, "epoch": 1.8482513337285122, "mse_loss": 0.05227569118142128, "step": 15590 }, { "epoch": 1.8494368701837582, "grad_norm": 0.578125, "learning_rate": 0.00018872418890278117, "loss": 0.8524, "step": 15600 }, { "contrastive_loss": 3.9217529296875, "epoch": 1.8494368701837582, "mse_loss": 0.06489522010087967, "step": 15600 }, { "epoch": 1.8506224066390042, "grad_norm": 0.478515625, "learning_rate": 0.0001887051124968771, "loss": 0.8487, "step": 15610 }, { "contrastive_loss": 3.9833984375, "epoch": 1.8506224066390042, "mse_loss": 0.05061572045087814, "step": 15610 }, { "epoch": 1.8518079430942502, "grad_norm": 0.373046875, "learning_rate": 0.0001886860209336954, "loss": 0.8479, "step": 15620 }, { "contrastive_loss": 3.865478515625, "epoch": 1.8518079430942502, "mse_loss": 0.08026949316263199, "step": 15620 }, { "epoch": 1.8529934795494962, "grad_norm": 0.32421875, "learning_rate": 0.00018866691421649828, "loss": 0.8258, "step": 15630 }, { "contrastive_loss": 3.818603515625, "epoch": 1.8529934795494962, "mse_loss": 0.06284630298614502, "step": 15630 }, { "epoch": 1.8541790160047422, "grad_norm": 0.5, "learning_rate": 0.00018864779234855058, "loss": 0.8361, "step": 15640 }, { "contrastive_loss": 3.91259765625, "epoch": 1.8541790160047422, "mse_loss": 0.0774337500333786, "step": 15640 }, { "epoch": 1.8553645524599882, "grad_norm": 0.46875, "learning_rate": 0.00018862865533311968, "loss": 0.8533, "step": 15650 }, { "contrastive_loss": 3.77685546875, "epoch": 1.8553645524599882, "mse_loss": 0.06117485091090202, "step": 15650 }, { "epoch": 1.8565500889152342, "grad_norm": 0.3671875, "learning_rate": 0.00018860950317347555, "loss": 0.832, "step": 15660 }, { "contrastive_loss": 3.9693603515625, "epoch": 1.8565500889152342, "mse_loss": 0.07879924774169922, "step": 15660 }, { "epoch": 1.8577356253704802, "grad_norm": 0.326171875, "learning_rate": 0.00018859033587289084, "loss": 0.8457, "step": 15670 }, { "contrastive_loss": 3.8658447265625, "epoch": 1.8577356253704802, "mse_loss": 0.07932048290967941, "step": 15670 }, { "epoch": 1.8589211618257262, "grad_norm": 0.439453125, "learning_rate": 0.00018857115343464068, "loss": 0.8471, "step": 15680 }, { "contrastive_loss": 3.9193115234375, "epoch": 1.8589211618257262, "mse_loss": 0.06401190906763077, "step": 15680 }, { "epoch": 1.8601066982809722, "grad_norm": 0.48828125, "learning_rate": 0.0001885519558620028, "loss": 0.8368, "step": 15690 }, { "contrastive_loss": 3.8524169921875, "epoch": 1.8601066982809722, "mse_loss": 0.09662923961877823, "step": 15690 }, { "epoch": 1.8612922347362182, "grad_norm": 0.55078125, "learning_rate": 0.00018853274315825758, "loss": 0.843, "step": 15700 }, { "contrastive_loss": 3.9581298828125, "epoch": 1.8612922347362182, "mse_loss": 0.07588206231594086, "step": 15700 }, { "epoch": 1.8624777711914642, "grad_norm": 0.455078125, "learning_rate": 0.00018851351532668794, "loss": 0.8601, "step": 15710 }, { "contrastive_loss": 4.0927734375, "epoch": 1.8624777711914642, "mse_loss": 0.07081577181816101, "step": 15710 }, { "epoch": 1.8636633076467102, "grad_norm": 0.44921875, "learning_rate": 0.00018849427237057937, "loss": 0.852, "step": 15720 }, { "contrastive_loss": 3.895263671875, "epoch": 1.8636633076467102, "mse_loss": 0.08709901571273804, "step": 15720 }, { "epoch": 1.8648488441019562, "grad_norm": 0.58203125, "learning_rate": 0.00018847501429322, "loss": 0.8427, "step": 15730 }, { "contrastive_loss": 3.9603271484375, "epoch": 1.8648488441019562, "mse_loss": 0.07462495565414429, "step": 15730 }, { "epoch": 1.8660343805572022, "grad_norm": 0.45703125, "learning_rate": 0.00018845574109790044, "loss": 0.8511, "step": 15740 }, { "contrastive_loss": 3.87890625, "epoch": 1.8660343805572022, "mse_loss": 0.05351719260215759, "step": 15740 }, { "epoch": 1.8672199170124482, "grad_norm": 0.51171875, "learning_rate": 0.000188436452787914, "loss": 0.8518, "step": 15750 }, { "contrastive_loss": 4.1253662109375, "epoch": 1.8672199170124482, "mse_loss": 0.06753219664096832, "step": 15750 }, { "epoch": 1.8684054534676942, "grad_norm": 0.46875, "learning_rate": 0.00018841714936655655, "loss": 0.8622, "step": 15760 }, { "contrastive_loss": 4.0128173828125, "epoch": 1.8684054534676942, "mse_loss": 0.08618521690368652, "step": 15760 }, { "epoch": 1.8695909899229401, "grad_norm": 0.447265625, "learning_rate": 0.00018839783083712645, "loss": 0.8564, "step": 15770 }, { "contrastive_loss": 3.9154052734375, "epoch": 1.8695909899229401, "mse_loss": 0.05627689138054848, "step": 15770 }, { "epoch": 1.8707765263781861, "grad_norm": 0.369140625, "learning_rate": 0.0001883784972029248, "loss": 0.8621, "step": 15780 }, { "contrastive_loss": 3.864013671875, "epoch": 1.8707765263781861, "mse_loss": 0.06564804166555405, "step": 15780 }, { "epoch": 1.8719620628334321, "grad_norm": 0.3828125, "learning_rate": 0.00018835914846725512, "loss": 0.8477, "step": 15790 }, { "contrastive_loss": 3.8865966796875, "epoch": 1.8719620628334321, "mse_loss": 0.07803268730640411, "step": 15790 }, { "epoch": 1.8731475992886781, "grad_norm": 0.392578125, "learning_rate": 0.00018833978463342357, "loss": 0.85, "step": 15800 }, { "contrastive_loss": 3.956787109375, "epoch": 1.8731475992886781, "mse_loss": 0.061028603464365005, "step": 15800 }, { "epoch": 1.8743331357439241, "grad_norm": 0.373046875, "learning_rate": 0.00018832040570473891, "loss": 0.844, "step": 15810 }, { "contrastive_loss": 3.8797607421875, "epoch": 1.8743331357439241, "mse_loss": 0.052865978330373764, "step": 15810 }, { "epoch": 1.8755186721991701, "grad_norm": 0.43359375, "learning_rate": 0.00018830101168451253, "loss": 0.8532, "step": 15820 }, { "contrastive_loss": 3.778076171875, "epoch": 1.8755186721991701, "mse_loss": 0.06108846887946129, "step": 15820 }, { "epoch": 1.8767042086544161, "grad_norm": 0.447265625, "learning_rate": 0.00018828160257605827, "loss": 0.8513, "step": 15830 }, { "contrastive_loss": 3.8427734375, "epoch": 1.8767042086544161, "mse_loss": 0.06651557981967926, "step": 15830 }, { "epoch": 1.8778897451096621, "grad_norm": 0.494140625, "learning_rate": 0.00018826217838269264, "loss": 0.837, "step": 15840 }, { "contrastive_loss": 3.968505859375, "epoch": 1.8778897451096621, "mse_loss": 0.09170757234096527, "step": 15840 }, { "epoch": 1.879075281564908, "grad_norm": 0.40625, "learning_rate": 0.00018824273910773468, "loss": 0.8514, "step": 15850 }, { "contrastive_loss": 3.7774658203125, "epoch": 1.879075281564908, "mse_loss": 0.05701256915926933, "step": 15850 }, { "epoch": 1.880260818020154, "grad_norm": 0.431640625, "learning_rate": 0.00018822328475450606, "loss": 0.8557, "step": 15860 }, { "contrastive_loss": 3.920166015625, "epoch": 1.880260818020154, "mse_loss": 0.0630163922905922, "step": 15860 }, { "epoch": 1.8814463544754, "grad_norm": 0.384765625, "learning_rate": 0.000188203815326331, "loss": 0.8502, "step": 15870 }, { "contrastive_loss": 4.0150146484375, "epoch": 1.8814463544754, "mse_loss": 0.07153116911649704, "step": 15870 }, { "epoch": 1.882631890930646, "grad_norm": 0.369140625, "learning_rate": 0.0001881843308265363, "loss": 0.8603, "step": 15880 }, { "contrastive_loss": 3.851318359375, "epoch": 1.882631890930646, "mse_loss": 0.04391488432884216, "step": 15880 }, { "epoch": 1.883817427385892, "grad_norm": 0.53515625, "learning_rate": 0.00018816483125845128, "loss": 0.8506, "step": 15890 }, { "contrastive_loss": 3.9146728515625, "epoch": 1.883817427385892, "mse_loss": 0.06171527877449989, "step": 15890 }, { "epoch": 1.885002963841138, "grad_norm": 0.41015625, "learning_rate": 0.0001881453166254079, "loss": 0.8477, "step": 15900 }, { "contrastive_loss": 3.9373779296875, "epoch": 1.885002963841138, "mse_loss": 0.06870496273040771, "step": 15900 }, { "epoch": 1.886188500296384, "grad_norm": 0.41796875, "learning_rate": 0.0001881257869307407, "loss": 0.8528, "step": 15910 }, { "contrastive_loss": 3.86865234375, "epoch": 1.886188500296384, "mse_loss": 0.08736485987901688, "step": 15910 }, { "epoch": 1.88737403675163, "grad_norm": 0.423828125, "learning_rate": 0.00018810624217778678, "loss": 0.8446, "step": 15920 }, { "contrastive_loss": 3.7998046875, "epoch": 1.88737403675163, "mse_loss": 0.09907891601324081, "step": 15920 }, { "epoch": 1.888559573206876, "grad_norm": 0.5390625, "learning_rate": 0.00018808668236988576, "loss": 0.8639, "step": 15930 }, { "contrastive_loss": 3.837158203125, "epoch": 1.888559573206876, "mse_loss": 0.07475483417510986, "step": 15930 }, { "epoch": 1.889745109662122, "grad_norm": 0.66015625, "learning_rate": 0.0001880671075103799, "loss": 0.8497, "step": 15940 }, { "contrastive_loss": 3.9869384765625, "epoch": 1.889745109662122, "mse_loss": 0.060607314109802246, "step": 15940 }, { "epoch": 1.890930646117368, "grad_norm": 0.458984375, "learning_rate": 0.000188047517602614, "loss": 0.8604, "step": 15950 }, { "contrastive_loss": 3.9541015625, "epoch": 1.890930646117368, "mse_loss": 0.09503436088562012, "step": 15950 }, { "epoch": 1.892116182572614, "grad_norm": 0.482421875, "learning_rate": 0.00018802791264993548, "loss": 0.8522, "step": 15960 }, { "contrastive_loss": 3.984130859375, "epoch": 1.892116182572614, "mse_loss": 0.10718891769647598, "step": 15960 }, { "epoch": 1.89330171902786, "grad_norm": 0.69140625, "learning_rate": 0.00018800829265569423, "loss": 0.8543, "step": 15970 }, { "contrastive_loss": 3.93212890625, "epoch": 1.89330171902786, "mse_loss": 0.07337740808725357, "step": 15970 }, { "epoch": 1.894487255483106, "grad_norm": 0.458984375, "learning_rate": 0.0001879886576232428, "loss": 0.8572, "step": 15980 }, { "contrastive_loss": 3.8756103515625, "epoch": 1.894487255483106, "mse_loss": 0.07210779190063477, "step": 15980 }, { "epoch": 1.895672791938352, "grad_norm": 0.46875, "learning_rate": 0.0001879690075559363, "loss": 0.8492, "step": 15990 }, { "contrastive_loss": 3.9254150390625, "epoch": 1.895672791938352, "mse_loss": 0.056716032326221466, "step": 15990 }, { "epoch": 1.896858328393598, "grad_norm": 0.546875, "learning_rate": 0.0001879493424571323, "loss": 0.8548, "step": 16000 }, { "contrastive_loss": 3.80908203125, "epoch": 1.896858328393598, "mse_loss": 0.06356944143772125, "step": 16000 }, { "epoch": 1.898043864848844, "grad_norm": 0.46484375, "learning_rate": 0.00018792966233019116, "loss": 0.8392, "step": 16010 }, { "contrastive_loss": 3.8743896484375, "epoch": 1.898043864848844, "mse_loss": 0.04813525080680847, "step": 16010 }, { "epoch": 1.89922940130409, "grad_norm": 0.400390625, "learning_rate": 0.0001879099671784756, "loss": 0.8339, "step": 16020 }, { "contrastive_loss": 3.8443603515625, "epoch": 1.89922940130409, "mse_loss": 0.05631011351943016, "step": 16020 }, { "epoch": 1.900414937759336, "grad_norm": 0.3984375, "learning_rate": 0.000187890257005351, "loss": 0.8461, "step": 16030 }, { "contrastive_loss": 3.81103515625, "epoch": 1.900414937759336, "mse_loss": 0.09662651270627975, "step": 16030 }, { "epoch": 1.901600474214582, "grad_norm": 0.380859375, "learning_rate": 0.00018787053181418525, "loss": 0.8524, "step": 16040 }, { "contrastive_loss": 4.0616455078125, "epoch": 1.901600474214582, "mse_loss": 0.06900044530630112, "step": 16040 }, { "epoch": 1.902786010669828, "grad_norm": 0.462890625, "learning_rate": 0.00018785079160834887, "loss": 0.8613, "step": 16050 }, { "contrastive_loss": 3.8583984375, "epoch": 1.902786010669828, "mse_loss": 0.0979616716504097, "step": 16050 }, { "epoch": 1.903971547125074, "grad_norm": 0.419921875, "learning_rate": 0.00018783103639121495, "loss": 0.8467, "step": 16060 }, { "contrastive_loss": 3.9766845703125, "epoch": 1.903971547125074, "mse_loss": 0.0439307764172554, "step": 16060 }, { "epoch": 1.90515708358032, "grad_norm": 0.388671875, "learning_rate": 0.0001878112661661591, "loss": 0.848, "step": 16070 }, { "contrastive_loss": 3.87255859375, "epoch": 1.90515708358032, "mse_loss": 0.0804969072341919, "step": 16070 }, { "epoch": 1.906342620035566, "grad_norm": 0.458984375, "learning_rate": 0.0001877914809365595, "loss": 0.8547, "step": 16080 }, { "contrastive_loss": 3.8800048828125, "epoch": 1.906342620035566, "mse_loss": 0.07637478411197662, "step": 16080 }, { "epoch": 1.907528156490812, "grad_norm": 0.5078125, "learning_rate": 0.0001877716807057969, "loss": 0.8518, "step": 16090 }, { "contrastive_loss": 3.7845458984375, "epoch": 1.907528156490812, "mse_loss": 0.05889435485005379, "step": 16090 }, { "epoch": 1.908713692946058, "grad_norm": 0.34765625, "learning_rate": 0.00018775186547725464, "loss": 0.8408, "step": 16100 }, { "contrastive_loss": 3.912353515625, "epoch": 1.908713692946058, "mse_loss": 0.05464806780219078, "step": 16100 }, { "epoch": 1.909899229401304, "grad_norm": 0.5078125, "learning_rate": 0.00018773203525431859, "loss": 0.8479, "step": 16110 }, { "contrastive_loss": 4.0194091796875, "epoch": 1.909899229401304, "mse_loss": 0.0592101626098156, "step": 16110 }, { "epoch": 1.91108476585655, "grad_norm": 0.390625, "learning_rate": 0.0001877121900403772, "loss": 0.8467, "step": 16120 }, { "contrastive_loss": 3.882568359375, "epoch": 1.91108476585655, "mse_loss": 0.06302370876073837, "step": 16120 }, { "epoch": 1.912270302311796, "grad_norm": 0.404296875, "learning_rate": 0.00018769232983882142, "loss": 0.8437, "step": 16130 }, { "contrastive_loss": 3.9005126953125, "epoch": 1.912270302311796, "mse_loss": 0.049861710518598557, "step": 16130 }, { "epoch": 1.913455838767042, "grad_norm": 0.388671875, "learning_rate": 0.0001876724546530449, "loss": 0.8474, "step": 16140 }, { "contrastive_loss": 3.831787109375, "epoch": 1.913455838767042, "mse_loss": 0.048732299357652664, "step": 16140 }, { "epoch": 1.914641375222288, "grad_norm": 0.412109375, "learning_rate": 0.00018765256448644374, "loss": 0.8351, "step": 16150 }, { "contrastive_loss": 3.8673095703125, "epoch": 1.914641375222288, "mse_loss": 0.07394640892744064, "step": 16150 }, { "epoch": 1.915826911677534, "grad_norm": 0.5625, "learning_rate": 0.00018763265934241657, "loss": 0.8563, "step": 16160 }, { "contrastive_loss": 3.7161865234375, "epoch": 1.915826911677534, "mse_loss": 0.04542091116309166, "step": 16160 }, { "epoch": 1.91701244813278, "grad_norm": 0.48828125, "learning_rate": 0.0001876127392243647, "loss": 0.8411, "step": 16170 }, { "contrastive_loss": 3.917724609375, "epoch": 1.91701244813278, "mse_loss": 0.07160820066928864, "step": 16170 }, { "epoch": 1.918197984588026, "grad_norm": 0.546875, "learning_rate": 0.00018759280413569194, "loss": 0.8453, "step": 16180 }, { "contrastive_loss": 3.8529052734375, "epoch": 1.918197984588026, "mse_loss": 0.0851801186800003, "step": 16180 }, { "epoch": 1.919383521043272, "grad_norm": 0.52734375, "learning_rate": 0.00018757285407980457, "loss": 0.8546, "step": 16190 }, { "contrastive_loss": 3.8675537109375, "epoch": 1.919383521043272, "mse_loss": 0.06901567429304123, "step": 16190 }, { "epoch": 1.920569057498518, "grad_norm": 0.5546875, "learning_rate": 0.0001875528890601116, "loss": 0.852, "step": 16200 }, { "contrastive_loss": 3.7752685546875, "epoch": 1.920569057498518, "mse_loss": 0.06492412090301514, "step": 16200 }, { "epoch": 1.921754593953764, "grad_norm": 0.41015625, "learning_rate": 0.00018753290908002444, "loss": 0.8405, "step": 16210 }, { "contrastive_loss": 3.836669921875, "epoch": 1.921754593953764, "mse_loss": 0.06444888561964035, "step": 16210 }, { "epoch": 1.9229401304090101, "grad_norm": 0.46484375, "learning_rate": 0.00018751291414295716, "loss": 0.8422, "step": 16220 }, { "contrastive_loss": 3.9378662109375, "epoch": 1.9229401304090101, "mse_loss": 0.08626624196767807, "step": 16220 }, { "epoch": 1.9241256668642561, "grad_norm": 0.63671875, "learning_rate": 0.00018749290425232632, "loss": 0.8513, "step": 16230 }, { "contrastive_loss": 3.9764404296875, "epoch": 1.9241256668642561, "mse_loss": 0.06378837674856186, "step": 16230 }, { "epoch": 1.9253112033195021, "grad_norm": 0.416015625, "learning_rate": 0.0001874728794115511, "loss": 0.8418, "step": 16240 }, { "contrastive_loss": 3.841552734375, "epoch": 1.9253112033195021, "mse_loss": 0.09026629477739334, "step": 16240 }, { "epoch": 1.9264967397747481, "grad_norm": 0.466796875, "learning_rate": 0.00018745283962405318, "loss": 0.8566, "step": 16250 }, { "contrastive_loss": 3.8062744140625, "epoch": 1.9264967397747481, "mse_loss": 0.08766857534646988, "step": 16250 }, { "epoch": 1.927682276229994, "grad_norm": 0.431640625, "learning_rate": 0.0001874327848932568, "loss": 0.8586, "step": 16260 }, { "contrastive_loss": 3.7664794921875, "epoch": 1.927682276229994, "mse_loss": 0.06672387570142746, "step": 16260 }, { "epoch": 1.92886781268524, "grad_norm": 0.48828125, "learning_rate": 0.00018741271522258876, "loss": 0.8487, "step": 16270 }, { "contrastive_loss": 3.90380859375, "epoch": 1.92886781268524, "mse_loss": 0.05191916599869728, "step": 16270 }, { "epoch": 1.930053349140486, "grad_norm": 0.3671875, "learning_rate": 0.0001873926306154784, "loss": 0.8546, "step": 16280 }, { "contrastive_loss": 4.01220703125, "epoch": 1.930053349140486, "mse_loss": 0.06942696869373322, "step": 16280 }, { "epoch": 1.931238885595732, "grad_norm": 0.462890625, "learning_rate": 0.00018737253107535776, "loss": 0.8585, "step": 16290 }, { "contrastive_loss": 3.896240234375, "epoch": 1.931238885595732, "mse_loss": 0.07007528096437454, "step": 16290 }, { "epoch": 1.932424422050978, "grad_norm": 0.3671875, "learning_rate": 0.00018735241660566113, "loss": 0.8398, "step": 16300 }, { "contrastive_loss": 3.941650390625, "epoch": 1.932424422050978, "mse_loss": 0.06766221672296524, "step": 16300 }, { "epoch": 1.933609958506224, "grad_norm": 0.435546875, "learning_rate": 0.00018733228720982563, "loss": 0.8448, "step": 16310 }, { "contrastive_loss": 3.9879150390625, "epoch": 1.933609958506224, "mse_loss": 0.06698478013277054, "step": 16310 }, { "epoch": 1.93479549496147, "grad_norm": 0.4765625, "learning_rate": 0.00018731214289129078, "loss": 0.8423, "step": 16320 }, { "contrastive_loss": 4.0341796875, "epoch": 1.93479549496147, "mse_loss": 0.06554123014211655, "step": 16320 }, { "epoch": 1.935981031416716, "grad_norm": 0.43359375, "learning_rate": 0.00018729198365349868, "loss": 0.855, "step": 16330 }, { "contrastive_loss": 3.8897705078125, "epoch": 1.935981031416716, "mse_loss": 0.0853496789932251, "step": 16330 }, { "epoch": 1.937166567871962, "grad_norm": 0.38671875, "learning_rate": 0.000187271809499894, "loss": 0.8541, "step": 16340 }, { "contrastive_loss": 3.7657470703125, "epoch": 1.937166567871962, "mse_loss": 0.05373971909284592, "step": 16340 }, { "epoch": 1.938352104327208, "grad_norm": 0.4765625, "learning_rate": 0.00018725162043392403, "loss": 0.8501, "step": 16350 }, { "contrastive_loss": 3.951904296875, "epoch": 1.938352104327208, "mse_loss": 0.05876339226961136, "step": 16350 }, { "epoch": 1.939537640782454, "grad_norm": 0.546875, "learning_rate": 0.00018723141645903842, "loss": 0.847, "step": 16360 }, { "contrastive_loss": 4.01904296875, "epoch": 1.939537640782454, "mse_loss": 0.0596211738884449, "step": 16360 }, { "epoch": 1.9407231772377, "grad_norm": 0.478515625, "learning_rate": 0.00018721119757868953, "loss": 0.8515, "step": 16370 }, { "contrastive_loss": 4.0045166015625, "epoch": 1.9407231772377, "mse_loss": 0.06975740939378738, "step": 16370 }, { "epoch": 1.941908713692946, "grad_norm": 0.431640625, "learning_rate": 0.00018719096379633221, "loss": 0.8466, "step": 16380 }, { "contrastive_loss": 4.0699462890625, "epoch": 1.941908713692946, "mse_loss": 0.07873112708330154, "step": 16380 }, { "epoch": 1.943094250148192, "grad_norm": 0.515625, "learning_rate": 0.00018717071511542387, "loss": 0.8563, "step": 16390 }, { "contrastive_loss": 4.1026611328125, "epoch": 1.943094250148192, "mse_loss": 0.06586108356714249, "step": 16390 }, { "epoch": 1.944279786603438, "grad_norm": 0.435546875, "learning_rate": 0.00018715045153942442, "loss": 0.8448, "step": 16400 }, { "contrastive_loss": 3.8975830078125, "epoch": 1.944279786603438, "mse_loss": 0.081601083278656, "step": 16400 }, { "epoch": 1.945465323058684, "grad_norm": 0.462890625, "learning_rate": 0.00018713017307179637, "loss": 0.8566, "step": 16410 }, { "contrastive_loss": 3.8668212890625, "epoch": 1.945465323058684, "mse_loss": 0.0472777783870697, "step": 16410 }, { "epoch": 1.94665085951393, "grad_norm": 0.53515625, "learning_rate": 0.00018710987971600474, "loss": 0.847, "step": 16420 }, { "contrastive_loss": 3.9708251953125, "epoch": 1.94665085951393, "mse_loss": 0.06601804494857788, "step": 16420 }, { "epoch": 1.947836395969176, "grad_norm": 0.470703125, "learning_rate": 0.00018708957147551715, "loss": 0.8433, "step": 16430 }, { "contrastive_loss": 3.9522705078125, "epoch": 1.947836395969176, "mse_loss": 0.06702343374490738, "step": 16430 }, { "epoch": 1.949021932424422, "grad_norm": 0.419921875, "learning_rate": 0.00018706924835380372, "loss": 0.839, "step": 16440 }, { "contrastive_loss": 3.885009765625, "epoch": 1.949021932424422, "mse_loss": 0.07132306694984436, "step": 16440 }, { "epoch": 1.950207468879668, "grad_norm": 0.41796875, "learning_rate": 0.00018704891035433707, "loss": 0.839, "step": 16450 }, { "contrastive_loss": 3.8922119140625, "epoch": 1.950207468879668, "mse_loss": 0.03385934606194496, "step": 16450 }, { "epoch": 1.951393005334914, "grad_norm": 0.484375, "learning_rate": 0.00018702855748059242, "loss": 0.8447, "step": 16460 }, { "contrastive_loss": 3.931640625, "epoch": 1.951393005334914, "mse_loss": 0.06365964561700821, "step": 16460 }, { "epoch": 1.95257854179016, "grad_norm": 0.470703125, "learning_rate": 0.00018700818973604757, "loss": 0.84, "step": 16470 }, { "contrastive_loss": 3.875, "epoch": 1.95257854179016, "mse_loss": 0.058052729815244675, "step": 16470 }, { "epoch": 1.9537640782454062, "grad_norm": 0.3671875, "learning_rate": 0.00018698780712418276, "loss": 0.8491, "step": 16480 }, { "contrastive_loss": 3.959228515625, "epoch": 1.9537640782454062, "mse_loss": 0.08346835523843765, "step": 16480 }, { "epoch": 1.9549496147006522, "grad_norm": 0.546875, "learning_rate": 0.00018696740964848084, "loss": 0.8507, "step": 16490 }, { "contrastive_loss": 3.871337890625, "epoch": 1.9549496147006522, "mse_loss": 0.08912342041730881, "step": 16490 }, { "epoch": 1.9561351511558982, "grad_norm": 0.419921875, "learning_rate": 0.00018694699731242715, "loss": 0.8561, "step": 16500 }, { "contrastive_loss": 3.817138671875, "epoch": 1.9561351511558982, "mse_loss": 0.05604153499007225, "step": 16500 }, { "epoch": 1.9573206876111442, "grad_norm": 0.42578125, "learning_rate": 0.00018692657011950962, "loss": 0.8374, "step": 16510 }, { "contrastive_loss": 3.835205078125, "epoch": 1.9573206876111442, "mse_loss": 0.08100060373544693, "step": 16510 }, { "epoch": 1.9585062240663902, "grad_norm": 0.52734375, "learning_rate": 0.00018690612807321873, "loss": 0.8443, "step": 16520 }, { "contrastive_loss": 4.1519775390625, "epoch": 1.9585062240663902, "mse_loss": 0.08658143132925034, "step": 16520 }, { "epoch": 1.9596917605216362, "grad_norm": 0.4296875, "learning_rate": 0.00018688567117704742, "loss": 0.8564, "step": 16530 }, { "contrastive_loss": 3.812255859375, "epoch": 1.9596917605216362, "mse_loss": 0.04543602094054222, "step": 16530 }, { "epoch": 1.9608772969768822, "grad_norm": 0.39453125, "learning_rate": 0.00018686519943449125, "loss": 0.8463, "step": 16540 }, { "contrastive_loss": 3.8856201171875, "epoch": 1.9608772969768822, "mse_loss": 0.04625121131539345, "step": 16540 }, { "epoch": 1.9620628334321282, "grad_norm": 0.416015625, "learning_rate": 0.00018684471284904827, "loss": 0.8492, "step": 16550 }, { "contrastive_loss": 3.906005859375, "epoch": 1.9620628334321282, "mse_loss": 0.053314048796892166, "step": 16550 }, { "epoch": 1.9632483698873742, "grad_norm": 0.447265625, "learning_rate": 0.00018682421142421907, "loss": 0.8476, "step": 16560 }, { "contrastive_loss": 3.8870849609375, "epoch": 1.9632483698873742, "mse_loss": 0.10700688511133194, "step": 16560 }, { "epoch": 1.9644339063426202, "grad_norm": 0.55859375, "learning_rate": 0.00018680369516350676, "loss": 0.8521, "step": 16570 }, { "contrastive_loss": 3.7886962890625, "epoch": 1.9644339063426202, "mse_loss": 0.07208289206027985, "step": 16570 }, { "epoch": 1.9656194427978662, "grad_norm": 0.484375, "learning_rate": 0.00018678316407041707, "loss": 0.8424, "step": 16580 }, { "contrastive_loss": 3.876220703125, "epoch": 1.9656194427978662, "mse_loss": 0.069124735891819, "step": 16580 }, { "epoch": 1.9668049792531122, "grad_norm": 0.375, "learning_rate": 0.00018676261814845816, "loss": 0.8472, "step": 16590 }, { "contrastive_loss": 3.9962158203125, "epoch": 1.9668049792531122, "mse_loss": 0.05977558344602585, "step": 16590 }, { "epoch": 1.9679905157083581, "grad_norm": 0.50390625, "learning_rate": 0.00018674205740114075, "loss": 0.8461, "step": 16600 }, { "contrastive_loss": 3.982666015625, "epoch": 1.9679905157083581, "mse_loss": 0.04512954503297806, "step": 16600 }, { "epoch": 1.9691760521636041, "grad_norm": 0.58203125, "learning_rate": 0.00018672148183197814, "loss": 0.8344, "step": 16610 }, { "contrastive_loss": 3.9129638671875, "epoch": 1.9691760521636041, "mse_loss": 0.05007680878043175, "step": 16610 }, { "epoch": 1.9703615886188501, "grad_norm": 0.46484375, "learning_rate": 0.0001867008914444861, "loss": 0.8432, "step": 16620 }, { "contrastive_loss": 4.04248046875, "epoch": 1.9703615886188501, "mse_loss": 0.062014561146497726, "step": 16620 }, { "epoch": 1.9715471250740961, "grad_norm": 0.408203125, "learning_rate": 0.00018668028624218303, "loss": 0.845, "step": 16630 }, { "contrastive_loss": 3.827392578125, "epoch": 1.9715471250740961, "mse_loss": 0.09125407785177231, "step": 16630 }, { "epoch": 1.9727326615293421, "grad_norm": 0.423828125, "learning_rate": 0.00018665966622858973, "loss": 0.8381, "step": 16640 }, { "contrastive_loss": 4.0323486328125, "epoch": 1.9727326615293421, "mse_loss": 0.06371597200632095, "step": 16640 }, { "epoch": 1.9739181979845881, "grad_norm": 0.51953125, "learning_rate": 0.0001866390314072296, "loss": 0.8602, "step": 16650 }, { "contrastive_loss": 3.8404541015625, "epoch": 1.9739181979845881, "mse_loss": 0.08486612886190414, "step": 16650 }, { "epoch": 1.9751037344398341, "grad_norm": 0.470703125, "learning_rate": 0.00018661838178162863, "loss": 0.8395, "step": 16660 }, { "contrastive_loss": 3.8408203125, "epoch": 1.9751037344398341, "mse_loss": 0.08886067569255829, "step": 16660 }, { "epoch": 1.97628927089508, "grad_norm": 0.390625, "learning_rate": 0.0001865977173553152, "loss": 0.8454, "step": 16670 }, { "contrastive_loss": 3.88525390625, "epoch": 1.97628927089508, "mse_loss": 0.07128873467445374, "step": 16670 }, { "epoch": 1.977474807350326, "grad_norm": 0.431640625, "learning_rate": 0.00018657703813182032, "loss": 0.8428, "step": 16680 }, { "contrastive_loss": 3.8011474609375, "epoch": 1.977474807350326, "mse_loss": 0.062466807663440704, "step": 16680 }, { "epoch": 1.978660343805572, "grad_norm": 0.5859375, "learning_rate": 0.0001865563441146775, "loss": 0.8465, "step": 16690 }, { "contrastive_loss": 3.7977294921875, "epoch": 1.978660343805572, "mse_loss": 0.07909712940454483, "step": 16690 }, { "epoch": 1.979845880260818, "grad_norm": 0.423828125, "learning_rate": 0.00018653563530742284, "loss": 0.8525, "step": 16700 }, { "contrastive_loss": 3.893310546875, "epoch": 1.979845880260818, "mse_loss": 0.05790535733103752, "step": 16700 }, { "epoch": 1.981031416716064, "grad_norm": 0.515625, "learning_rate": 0.00018651491171359482, "loss": 0.8421, "step": 16710 }, { "contrastive_loss": 3.945556640625, "epoch": 1.981031416716064, "mse_loss": 0.04809991270303726, "step": 16710 }, { "epoch": 1.98221695317131, "grad_norm": 0.458984375, "learning_rate": 0.0001864941733367346, "loss": 0.8429, "step": 16720 }, { "contrastive_loss": 3.94677734375, "epoch": 1.98221695317131, "mse_loss": 0.061103496700525284, "step": 16720 }, { "epoch": 1.983402489626556, "grad_norm": 0.5390625, "learning_rate": 0.00018647342018038575, "loss": 0.843, "step": 16730 }, { "contrastive_loss": 4.088623046875, "epoch": 1.983402489626556, "mse_loss": 0.06481283158063889, "step": 16730 }, { "epoch": 1.984588026081802, "grad_norm": 0.349609375, "learning_rate": 0.0001864526522480945, "loss": 0.842, "step": 16740 }, { "contrastive_loss": 3.99462890625, "epoch": 1.984588026081802, "mse_loss": 0.09086205810308456, "step": 16740 }, { "epoch": 1.985773562537048, "grad_norm": 0.484375, "learning_rate": 0.00018643186954340942, "loss": 0.8519, "step": 16750 }, { "contrastive_loss": 3.9052734375, "epoch": 1.985773562537048, "mse_loss": 0.07476348429918289, "step": 16750 }, { "epoch": 1.986959098992294, "grad_norm": 0.5, "learning_rate": 0.00018641107206988176, "loss": 0.8481, "step": 16760 }, { "contrastive_loss": 3.9619140625, "epoch": 1.986959098992294, "mse_loss": 0.05239927023649216, "step": 16760 }, { "epoch": 1.98814463544754, "grad_norm": 0.484375, "learning_rate": 0.00018639025983106523, "loss": 0.8501, "step": 16770 }, { "contrastive_loss": 3.9996337890625, "epoch": 1.98814463544754, "mse_loss": 0.06207878142595291, "step": 16770 }, { "epoch": 1.989330171902786, "grad_norm": 0.50390625, "learning_rate": 0.00018636943283051606, "loss": 0.8493, "step": 16780 }, { "contrastive_loss": 4.093505859375, "epoch": 1.989330171902786, "mse_loss": 0.07365696877241135, "step": 16780 }, { "epoch": 1.990515708358032, "grad_norm": 0.4609375, "learning_rate": 0.00018634859107179304, "loss": 0.8491, "step": 16790 }, { "contrastive_loss": 3.970458984375, "epoch": 1.990515708358032, "mse_loss": 0.05122145637869835, "step": 16790 }, { "epoch": 1.991701244813278, "grad_norm": 0.384765625, "learning_rate": 0.00018632773455845746, "loss": 0.8534, "step": 16800 }, { "contrastive_loss": 3.9134521484375, "epoch": 1.991701244813278, "mse_loss": 0.07520950585603714, "step": 16800 }, { "epoch": 1.992886781268524, "grad_norm": 0.51953125, "learning_rate": 0.00018630686329407312, "loss": 0.8515, "step": 16810 }, { "contrastive_loss": 3.8817138671875, "epoch": 1.992886781268524, "mse_loss": 0.07467729598283768, "step": 16810 }, { "epoch": 1.99407231772377, "grad_norm": 0.35546875, "learning_rate": 0.00018628597728220631, "loss": 0.8446, "step": 16820 }, { "contrastive_loss": 3.9200439453125, "epoch": 1.99407231772377, "mse_loss": 0.06396615505218506, "step": 16820 }, { "epoch": 1.995257854179016, "grad_norm": 0.53125, "learning_rate": 0.0001862650765264259, "loss": 0.8441, "step": 16830 }, { "contrastive_loss": 4.01171875, "epoch": 1.995257854179016, "mse_loss": 0.07585059851408005, "step": 16830 }, { "epoch": 1.996443390634262, "grad_norm": 0.400390625, "learning_rate": 0.0001862441610303033, "loss": 0.8456, "step": 16840 }, { "contrastive_loss": 3.7906494140625, "epoch": 1.996443390634262, "mse_loss": 0.047894496470689774, "step": 16840 }, { "epoch": 1.997628927089508, "grad_norm": 0.337890625, "learning_rate": 0.00018622323079741236, "loss": 0.8471, "step": 16850 }, { "contrastive_loss": 3.8062744140625, "epoch": 1.997628927089508, "mse_loss": 0.06947987526655197, "step": 16850 }, { "epoch": 1.998814463544754, "grad_norm": 0.3984375, "learning_rate": 0.00018620228583132947, "loss": 0.8393, "step": 16860 }, { "contrastive_loss": 3.9481201171875, "epoch": 1.998814463544754, "mse_loss": 0.07267407327890396, "step": 16860 }, { "epoch": 2.0, "grad_norm": 0.41015625, "learning_rate": 0.00018618132613563358, "loss": 0.8414, "step": 16870 }, { "contrastive_loss": 3.966552734375, "epoch": 2.0, "mse_loss": 0.09948260337114334, "step": 16870 }, { "epoch": 2.001185536455246, "grad_norm": 0.46875, "learning_rate": 0.00018616035171390612, "loss": 0.8563, "step": 16880 }, { "contrastive_loss": 3.810546875, "epoch": 2.001185536455246, "mse_loss": 0.06598932296037674, "step": 16880 }, { "epoch": 2.002371072910492, "grad_norm": 0.447265625, "learning_rate": 0.00018613936256973103, "loss": 0.8434, "step": 16890 }, { "contrastive_loss": 3.80615234375, "epoch": 2.002371072910492, "mse_loss": 0.062473833560943604, "step": 16890 }, { "epoch": 2.003556609365738, "grad_norm": 0.330078125, "learning_rate": 0.0001861183587066948, "loss": 0.8409, "step": 16900 }, { "contrastive_loss": 4.042236328125, "epoch": 2.003556609365738, "mse_loss": 0.08807928115129471, "step": 16900 }, { "epoch": 2.004742145820984, "grad_norm": 0.4296875, "learning_rate": 0.00018609734012838642, "loss": 0.8465, "step": 16910 }, { "contrastive_loss": 3.8389892578125, "epoch": 2.004742145820984, "mse_loss": 0.06862079352140427, "step": 16910 }, { "epoch": 2.00592768227623, "grad_norm": 0.423828125, "learning_rate": 0.00018607630683839735, "loss": 0.8273, "step": 16920 }, { "contrastive_loss": 3.8712158203125, "epoch": 2.00592768227623, "mse_loss": 0.050781942903995514, "step": 16920 }, { "epoch": 2.007113218731476, "grad_norm": 0.455078125, "learning_rate": 0.00018605525884032167, "loss": 0.8353, "step": 16930 }, { "contrastive_loss": 4.1307373046875, "epoch": 2.007113218731476, "mse_loss": 0.06516647338867188, "step": 16930 }, { "epoch": 2.008298755186722, "grad_norm": 0.427734375, "learning_rate": 0.00018603419613775585, "loss": 0.8555, "step": 16940 }, { "contrastive_loss": 3.9638671875, "epoch": 2.008298755186722, "mse_loss": 0.0831185132265091, "step": 16940 }, { "epoch": 2.009484291641968, "grad_norm": 0.359375, "learning_rate": 0.00018601311873429896, "loss": 0.8307, "step": 16950 }, { "contrastive_loss": 3.7652587890625, "epoch": 2.009484291641968, "mse_loss": 0.05715686082839966, "step": 16950 }, { "epoch": 2.010669828097214, "grad_norm": 0.404296875, "learning_rate": 0.00018599202663355255, "loss": 0.8389, "step": 16960 }, { "contrastive_loss": 3.9080810546875, "epoch": 2.010669828097214, "mse_loss": 0.07195223122835159, "step": 16960 }, { "epoch": 2.01185536455246, "grad_norm": 0.390625, "learning_rate": 0.00018597091983912065, "loss": 0.8439, "step": 16970 }, { "contrastive_loss": 3.878662109375, "epoch": 2.01185536455246, "mse_loss": 0.06124710291624069, "step": 16970 }, { "epoch": 2.013040901007706, "grad_norm": 0.369140625, "learning_rate": 0.00018594979835460986, "loss": 0.8385, "step": 16980 }, { "contrastive_loss": 3.81298828125, "epoch": 2.013040901007706, "mse_loss": 0.07496337592601776, "step": 16980 }, { "epoch": 2.014226437462952, "grad_norm": 0.359375, "learning_rate": 0.00018592866218362927, "loss": 0.8446, "step": 16990 }, { "contrastive_loss": 3.7984619140625, "epoch": 2.014226437462952, "mse_loss": 0.06408767402172089, "step": 16990 }, { "epoch": 2.015411973918198, "grad_norm": 0.451171875, "learning_rate": 0.00018590751132979046, "loss": 0.8549, "step": 17000 }, { "contrastive_loss": 3.7840576171875, "epoch": 2.015411973918198, "mse_loss": 0.05678202956914902, "step": 17000 }, { "epoch": 2.016597510373444, "grad_norm": 0.416015625, "learning_rate": 0.00018588634579670758, "loss": 0.8443, "step": 17010 }, { "contrastive_loss": 3.86962890625, "epoch": 2.016597510373444, "mse_loss": 0.07705974578857422, "step": 17010 }, { "epoch": 2.01778304682869, "grad_norm": 0.515625, "learning_rate": 0.00018586516558799718, "loss": 0.84, "step": 17020 }, { "contrastive_loss": 3.834228515625, "epoch": 2.01778304682869, "mse_loss": 0.06606994569301605, "step": 17020 }, { "epoch": 2.018968583283936, "grad_norm": 0.4921875, "learning_rate": 0.00018584397070727838, "loss": 0.8542, "step": 17030 }, { "contrastive_loss": 3.959228515625, "epoch": 2.018968583283936, "mse_loss": 0.07174008339643478, "step": 17030 }, { "epoch": 2.020154119739182, "grad_norm": 0.50390625, "learning_rate": 0.00018582276115817282, "loss": 0.834, "step": 17040 }, { "contrastive_loss": 3.8353271484375, "epoch": 2.020154119739182, "mse_loss": 0.051748037338256836, "step": 17040 }, { "epoch": 2.021339656194428, "grad_norm": 0.60546875, "learning_rate": 0.00018580153694430467, "loss": 0.8389, "step": 17050 }, { "contrastive_loss": 3.9061279296875, "epoch": 2.021339656194428, "mse_loss": 0.061856068670749664, "step": 17050 }, { "epoch": 2.022525192649674, "grad_norm": 0.43359375, "learning_rate": 0.0001857802980693005, "loss": 0.8481, "step": 17060 }, { "contrastive_loss": 3.8218994140625, "epoch": 2.022525192649674, "mse_loss": 0.036667514592409134, "step": 17060 }, { "epoch": 2.02371072910492, "grad_norm": 0.39453125, "learning_rate": 0.0001857590445367895, "loss": 0.8433, "step": 17070 }, { "contrastive_loss": 3.9359130859375, "epoch": 2.02371072910492, "mse_loss": 0.11859338730573654, "step": 17070 }, { "epoch": 2.024896265560166, "grad_norm": 0.4296875, "learning_rate": 0.0001857377763504033, "loss": 0.85, "step": 17080 }, { "contrastive_loss": 3.9381103515625, "epoch": 2.024896265560166, "mse_loss": 0.06343091279268265, "step": 17080 }, { "epoch": 2.026081802015412, "grad_norm": 0.41796875, "learning_rate": 0.00018571649351377606, "loss": 0.8372, "step": 17090 }, { "contrastive_loss": 4.1025390625, "epoch": 2.026081802015412, "mse_loss": 0.06576856970787048, "step": 17090 }, { "epoch": 2.027267338470658, "grad_norm": 0.3828125, "learning_rate": 0.0001856951960305444, "loss": 0.8479, "step": 17100 }, { "contrastive_loss": 4.0140380859375, "epoch": 2.027267338470658, "mse_loss": 0.06899291276931763, "step": 17100 }, { "epoch": 2.028452874925904, "grad_norm": 0.6484375, "learning_rate": 0.00018567388390434758, "loss": 0.8542, "step": 17110 }, { "contrastive_loss": 3.95849609375, "epoch": 2.028452874925904, "mse_loss": 0.05332678556442261, "step": 17110 }, { "epoch": 2.02963841138115, "grad_norm": 0.478515625, "learning_rate": 0.00018565255713882712, "loss": 0.8477, "step": 17120 }, { "contrastive_loss": 3.79931640625, "epoch": 2.02963841138115, "mse_loss": 0.07110845297574997, "step": 17120 }, { "epoch": 2.030823947836396, "grad_norm": 0.458984375, "learning_rate": 0.00018563121573762726, "loss": 0.8522, "step": 17130 }, { "contrastive_loss": 3.8270263671875, "epoch": 2.030823947836396, "mse_loss": 0.06490720063447952, "step": 17130 }, { "epoch": 2.032009484291642, "grad_norm": 0.44140625, "learning_rate": 0.00018560985970439466, "loss": 0.8562, "step": 17140 }, { "contrastive_loss": 3.85107421875, "epoch": 2.032009484291642, "mse_loss": 0.056295592337846756, "step": 17140 }, { "epoch": 2.033195020746888, "grad_norm": 0.4296875, "learning_rate": 0.00018558848904277848, "loss": 0.8476, "step": 17150 }, { "contrastive_loss": 3.872802734375, "epoch": 2.033195020746888, "mse_loss": 0.0697101280093193, "step": 17150 }, { "epoch": 2.034380557202134, "grad_norm": 0.44140625, "learning_rate": 0.00018556710375643035, "loss": 0.8463, "step": 17160 }, { "contrastive_loss": 4.099365234375, "epoch": 2.034380557202134, "mse_loss": 0.08117057383060455, "step": 17160 }, { "epoch": 2.03556609365738, "grad_norm": 0.474609375, "learning_rate": 0.00018554570384900448, "loss": 0.8494, "step": 17170 }, { "contrastive_loss": 3.84765625, "epoch": 2.03556609365738, "mse_loss": 0.05201907828450203, "step": 17170 }, { "epoch": 2.036751630112626, "grad_norm": 0.474609375, "learning_rate": 0.0001855242893241575, "loss": 0.8403, "step": 17180 }, { "contrastive_loss": 3.853515625, "epoch": 2.036751630112626, "mse_loss": 0.04548308998346329, "step": 17180 }, { "epoch": 2.037937166567872, "grad_norm": 0.4765625, "learning_rate": 0.00018550286018554854, "loss": 0.8458, "step": 17190 }, { "contrastive_loss": 3.878662109375, "epoch": 2.037937166567872, "mse_loss": 0.053761791437864304, "step": 17190 }, { "epoch": 2.039122703023118, "grad_norm": 0.63671875, "learning_rate": 0.00018548141643683929, "loss": 0.8426, "step": 17200 }, { "contrastive_loss": 3.8814697265625, "epoch": 2.039122703023118, "mse_loss": 0.1050848439335823, "step": 17200 }, { "epoch": 2.040308239478364, "grad_norm": 0.439453125, "learning_rate": 0.0001854599580816939, "loss": 0.8384, "step": 17210 }, { "contrastive_loss": 3.8603515625, "epoch": 2.040308239478364, "mse_loss": 0.08325202018022537, "step": 17210 }, { "epoch": 2.04149377593361, "grad_norm": 0.486328125, "learning_rate": 0.00018543848512377902, "loss": 0.8439, "step": 17220 }, { "contrastive_loss": 3.926025390625, "epoch": 2.04149377593361, "mse_loss": 0.06620723754167557, "step": 17220 }, { "epoch": 2.042679312388856, "grad_norm": 0.57421875, "learning_rate": 0.00018541699756676377, "loss": 0.8406, "step": 17230 }, { "contrastive_loss": 3.8748779296875, "epoch": 2.042679312388856, "mse_loss": 0.057721398770809174, "step": 17230 }, { "epoch": 2.043864848844102, "grad_norm": 0.42578125, "learning_rate": 0.00018539549541431982, "loss": 0.8361, "step": 17240 }, { "contrastive_loss": 3.9898681640625, "epoch": 2.043864848844102, "mse_loss": 0.057903025299310684, "step": 17240 }, { "epoch": 2.045050385299348, "grad_norm": 0.474609375, "learning_rate": 0.00018537397867012122, "loss": 0.8489, "step": 17250 }, { "contrastive_loss": 3.8729248046875, "epoch": 2.045050385299348, "mse_loss": 0.050732772797346115, "step": 17250 }, { "epoch": 2.046235921754594, "grad_norm": 0.55859375, "learning_rate": 0.0001853524473378447, "loss": 0.8463, "step": 17260 }, { "contrastive_loss": 3.9005126953125, "epoch": 2.046235921754594, "mse_loss": 0.07092788070440292, "step": 17260 }, { "epoch": 2.04742145820984, "grad_norm": 0.5546875, "learning_rate": 0.0001853309014211693, "loss": 0.8503, "step": 17270 }, { "contrastive_loss": 3.8543701171875, "epoch": 2.04742145820984, "mse_loss": 0.08184868842363358, "step": 17270 }, { "epoch": 2.048606994665086, "grad_norm": 0.486328125, "learning_rate": 0.00018530934092377666, "loss": 0.8472, "step": 17280 }, { "contrastive_loss": 3.9993896484375, "epoch": 2.048606994665086, "mse_loss": 0.07216526567935944, "step": 17280 }, { "epoch": 2.0497925311203318, "grad_norm": 0.51171875, "learning_rate": 0.00018528776584935086, "loss": 0.8409, "step": 17290 }, { "contrastive_loss": 3.90673828125, "epoch": 2.0497925311203318, "mse_loss": 0.05396909639239311, "step": 17290 }, { "epoch": 2.0509780675755778, "grad_norm": 0.37109375, "learning_rate": 0.0001852661762015785, "loss": 0.8371, "step": 17300 }, { "contrastive_loss": 4.0321044921875, "epoch": 2.0509780675755778, "mse_loss": 0.05011597275733948, "step": 17300 }, { "epoch": 2.0521636040308238, "grad_norm": 0.392578125, "learning_rate": 0.00018524457198414867, "loss": 0.8442, "step": 17310 }, { "contrastive_loss": 3.86865234375, "epoch": 2.0521636040308238, "mse_loss": 0.06357506662607193, "step": 17310 }, { "epoch": 2.0533491404860698, "grad_norm": 0.458984375, "learning_rate": 0.00018522295320075294, "loss": 0.8415, "step": 17320 }, { "contrastive_loss": 3.8641357421875, "epoch": 2.0533491404860698, "mse_loss": 0.07055462896823883, "step": 17320 }, { "epoch": 2.0545346769413158, "grad_norm": 0.490234375, "learning_rate": 0.0001852013198550854, "loss": 0.8571, "step": 17330 }, { "contrastive_loss": 3.8681640625, "epoch": 2.0545346769413158, "mse_loss": 0.08095037937164307, "step": 17330 }, { "epoch": 2.0557202133965617, "grad_norm": 0.462890625, "learning_rate": 0.00018517967195084249, "loss": 0.8432, "step": 17340 }, { "contrastive_loss": 3.9195556640625, "epoch": 2.0557202133965617, "mse_loss": 0.05002770945429802, "step": 17340 }, { "epoch": 2.0569057498518077, "grad_norm": 0.474609375, "learning_rate": 0.00018515800949172334, "loss": 0.8452, "step": 17350 }, { "contrastive_loss": 3.7366943359375, "epoch": 2.0569057498518077, "mse_loss": 0.06132226064801216, "step": 17350 }, { "epoch": 2.0580912863070537, "grad_norm": 0.484375, "learning_rate": 0.00018513633248142943, "loss": 0.8496, "step": 17360 }, { "contrastive_loss": 3.876953125, "epoch": 2.0580912863070537, "mse_loss": 0.07117348164319992, "step": 17360 }, { "epoch": 2.0592768227622997, "grad_norm": 0.408203125, "learning_rate": 0.0001851146409236648, "loss": 0.8421, "step": 17370 }, { "contrastive_loss": 3.907470703125, "epoch": 2.0592768227622997, "mse_loss": 0.05915094166994095, "step": 17370 }, { "epoch": 2.0604623592175457, "grad_norm": 0.431640625, "learning_rate": 0.00018509293482213592, "loss": 0.8392, "step": 17380 }, { "contrastive_loss": 3.8878173828125, "epoch": 2.0604623592175457, "mse_loss": 0.07702425867319107, "step": 17380 }, { "epoch": 2.0616478956727917, "grad_norm": 0.490234375, "learning_rate": 0.00018507121418055177, "loss": 0.8333, "step": 17390 }, { "contrastive_loss": 3.90966796875, "epoch": 2.0616478956727917, "mse_loss": 0.05362413078546524, "step": 17390 }, { "epoch": 2.0628334321280377, "grad_norm": 0.55078125, "learning_rate": 0.00018504947900262384, "loss": 0.846, "step": 17400 }, { "contrastive_loss": 3.8812255859375, "epoch": 2.0628334321280377, "mse_loss": 0.07412797957658768, "step": 17400 }, { "epoch": 2.0640189685832837, "grad_norm": 0.5, "learning_rate": 0.00018502772929206604, "loss": 0.8477, "step": 17410 }, { "contrastive_loss": 3.825927734375, "epoch": 2.0640189685832837, "mse_loss": 0.05668988451361656, "step": 17410 }, { "epoch": 2.06520450503853, "grad_norm": 0.431640625, "learning_rate": 0.00018500596505259482, "loss": 0.8453, "step": 17420 }, { "contrastive_loss": 3.7572021484375, "epoch": 2.06520450503853, "mse_loss": 0.059964243322610855, "step": 17420 }, { "epoch": 2.066390041493776, "grad_norm": 0.75, "learning_rate": 0.00018498418628792908, "loss": 0.8494, "step": 17430 }, { "contrastive_loss": 3.945556640625, "epoch": 2.066390041493776, "mse_loss": 0.05380352959036827, "step": 17430 }, { "epoch": 2.067575577949022, "grad_norm": 0.435546875, "learning_rate": 0.00018496239300179026, "loss": 0.8407, "step": 17440 }, { "contrastive_loss": 3.833251953125, "epoch": 2.067575577949022, "mse_loss": 0.05346972122788429, "step": 17440 }, { "epoch": 2.068761114404268, "grad_norm": 0.486328125, "learning_rate": 0.00018494058519790215, "loss": 0.8408, "step": 17450 }, { "contrastive_loss": 3.83203125, "epoch": 2.068761114404268, "mse_loss": 0.061719994992017746, "step": 17450 }, { "epoch": 2.069946650859514, "grad_norm": 0.431640625, "learning_rate": 0.0001849187628799912, "loss": 0.8395, "step": 17460 }, { "contrastive_loss": 3.848876953125, "epoch": 2.069946650859514, "mse_loss": 0.053672369569540024, "step": 17460 }, { "epoch": 2.07113218731476, "grad_norm": 0.48046875, "learning_rate": 0.00018489692605178618, "loss": 0.8369, "step": 17470 }, { "contrastive_loss": 3.88330078125, "epoch": 2.07113218731476, "mse_loss": 0.07101990282535553, "step": 17470 }, { "epoch": 2.072317723770006, "grad_norm": 0.396484375, "learning_rate": 0.00018487507471701847, "loss": 0.8481, "step": 17480 }, { "contrastive_loss": 3.806640625, "epoch": 2.072317723770006, "mse_loss": 0.06258544325828552, "step": 17480 }, { "epoch": 2.073503260225252, "grad_norm": 0.3359375, "learning_rate": 0.0001848532088794218, "loss": 0.837, "step": 17490 }, { "contrastive_loss": 3.8511962890625, "epoch": 2.073503260225252, "mse_loss": 0.06927298754453659, "step": 17490 }, { "epoch": 2.074688796680498, "grad_norm": 0.4921875, "learning_rate": 0.00018483132854273248, "loss": 0.8525, "step": 17500 }, { "contrastive_loss": 3.775146484375, "epoch": 2.074688796680498, "mse_loss": 0.06340374797582626, "step": 17500 }, { "epoch": 2.075874333135744, "grad_norm": 0.390625, "learning_rate": 0.00018480943371068927, "loss": 0.8381, "step": 17510 }, { "contrastive_loss": 3.80224609375, "epoch": 2.075874333135744, "mse_loss": 0.06693430989980698, "step": 17510 }, { "epoch": 2.07705986959099, "grad_norm": 0.412109375, "learning_rate": 0.00018478752438703334, "loss": 0.8359, "step": 17520 }, { "contrastive_loss": 3.8787841796875, "epoch": 2.07705986959099, "mse_loss": 0.0662493035197258, "step": 17520 }, { "epoch": 2.078245406046236, "grad_norm": 0.41796875, "learning_rate": 0.0001847656005755085, "loss": 0.8323, "step": 17530 }, { "contrastive_loss": 3.8385009765625, "epoch": 2.078245406046236, "mse_loss": 0.08191879093647003, "step": 17530 }, { "epoch": 2.079430942501482, "grad_norm": 0.431640625, "learning_rate": 0.00018474366227986082, "loss": 0.8558, "step": 17540 }, { "contrastive_loss": 3.8822021484375, "epoch": 2.079430942501482, "mse_loss": 0.05147722363471985, "step": 17540 }, { "epoch": 2.080616478956728, "grad_norm": 0.48046875, "learning_rate": 0.00018472170950383903, "loss": 0.8489, "step": 17550 }, { "contrastive_loss": 4.0787353515625, "epoch": 2.080616478956728, "mse_loss": 0.07685583829879761, "step": 17550 }, { "epoch": 2.081802015411974, "grad_norm": 0.443359375, "learning_rate": 0.00018469974225119418, "loss": 0.8499, "step": 17560 }, { "contrastive_loss": 3.8109130859375, "epoch": 2.081802015411974, "mse_loss": 0.045984864234924316, "step": 17560 }, { "epoch": 2.08298755186722, "grad_norm": 0.453125, "learning_rate": 0.00018467776052567998, "loss": 0.8328, "step": 17570 }, { "contrastive_loss": 3.9207763671875, "epoch": 2.08298755186722, "mse_loss": 0.08890807628631592, "step": 17570 }, { "epoch": 2.084173088322466, "grad_norm": 0.408203125, "learning_rate": 0.00018465576433105237, "loss": 0.8523, "step": 17580 }, { "contrastive_loss": 3.8524169921875, "epoch": 2.084173088322466, "mse_loss": 0.0531122088432312, "step": 17580 }, { "epoch": 2.085358624777712, "grad_norm": 0.369140625, "learning_rate": 0.00018463375367107004, "loss": 0.8323, "step": 17590 }, { "contrastive_loss": 3.8662109375, "epoch": 2.085358624777712, "mse_loss": 0.06178228184580803, "step": 17590 }, { "epoch": 2.086544161232958, "grad_norm": 0.34765625, "learning_rate": 0.00018461172854949395, "loss": 0.8361, "step": 17600 }, { "contrastive_loss": 3.88525390625, "epoch": 2.086544161232958, "mse_loss": 0.045755770057439804, "step": 17600 }, { "epoch": 2.087729697688204, "grad_norm": 0.361328125, "learning_rate": 0.00018458968897008758, "loss": 0.8342, "step": 17610 }, { "contrastive_loss": 3.8189697265625, "epoch": 2.087729697688204, "mse_loss": 0.05578397959470749, "step": 17610 }, { "epoch": 2.08891523414345, "grad_norm": 0.34765625, "learning_rate": 0.00018456763493661686, "loss": 0.8352, "step": 17620 }, { "contrastive_loss": 3.8603515625, "epoch": 2.08891523414345, "mse_loss": 0.058053720742464066, "step": 17620 }, { "epoch": 2.090100770598696, "grad_norm": 0.4296875, "learning_rate": 0.00018454556645285027, "loss": 0.8385, "step": 17630 }, { "contrastive_loss": 3.86669921875, "epoch": 2.090100770598696, "mse_loss": 0.06375057250261307, "step": 17630 }, { "epoch": 2.091286307053942, "grad_norm": 0.5390625, "learning_rate": 0.00018452348352255874, "loss": 0.8383, "step": 17640 }, { "contrastive_loss": 3.734375, "epoch": 2.091286307053942, "mse_loss": 0.07561404258012772, "step": 17640 }, { "epoch": 2.092471843509188, "grad_norm": 0.40625, "learning_rate": 0.0001845013861495156, "loss": 0.8362, "step": 17650 }, { "contrastive_loss": 3.8211669921875, "epoch": 2.092471843509188, "mse_loss": 0.07531131058931351, "step": 17650 }, { "epoch": 2.093657379964434, "grad_norm": 0.5859375, "learning_rate": 0.00018447927433749663, "loss": 0.854, "step": 17660 }, { "contrastive_loss": 3.837890625, "epoch": 2.093657379964434, "mse_loss": 0.06291048973798752, "step": 17660 }, { "epoch": 2.09484291641968, "grad_norm": 0.427734375, "learning_rate": 0.00018445714809028023, "loss": 0.8512, "step": 17670 }, { "contrastive_loss": 3.832763671875, "epoch": 2.09484291641968, "mse_loss": 0.059109438210725784, "step": 17670 }, { "epoch": 2.096028452874926, "grad_norm": 0.484375, "learning_rate": 0.0001844350074116471, "loss": 0.8409, "step": 17680 }, { "contrastive_loss": 4.0162353515625, "epoch": 2.096028452874926, "mse_loss": 0.06663314998149872, "step": 17680 }, { "epoch": 2.097213989330172, "grad_norm": 0.4140625, "learning_rate": 0.00018441285230538055, "loss": 0.8418, "step": 17690 }, { "contrastive_loss": 3.8338623046875, "epoch": 2.097213989330172, "mse_loss": 0.09824223071336746, "step": 17690 }, { "epoch": 2.098399525785418, "grad_norm": 0.4765625, "learning_rate": 0.00018439068277526622, "loss": 0.8538, "step": 17700 }, { "contrastive_loss": 4.0130615234375, "epoch": 2.098399525785418, "mse_loss": 0.06717853248119354, "step": 17700 }, { "epoch": 2.099585062240664, "grad_norm": 0.345703125, "learning_rate": 0.00018436849882509226, "loss": 0.8344, "step": 17710 }, { "contrastive_loss": 3.9564208984375, "epoch": 2.099585062240664, "mse_loss": 0.06281325966119766, "step": 17710 }, { "epoch": 2.10077059869591, "grad_norm": 0.41015625, "learning_rate": 0.00018434630045864936, "loss": 0.8413, "step": 17720 }, { "contrastive_loss": 3.9617919921875, "epoch": 2.10077059869591, "mse_loss": 0.08577414602041245, "step": 17720 }, { "epoch": 2.101956135151156, "grad_norm": 0.3984375, "learning_rate": 0.00018432408767973056, "loss": 0.8439, "step": 17730 }, { "contrastive_loss": 3.805908203125, "epoch": 2.101956135151156, "mse_loss": 0.07550973445177078, "step": 17730 }, { "epoch": 2.103141671606402, "grad_norm": 0.341796875, "learning_rate": 0.00018430186049213148, "loss": 0.8396, "step": 17740 }, { "contrastive_loss": 3.9171142578125, "epoch": 2.103141671606402, "mse_loss": 0.06153064966201782, "step": 17740 }, { "epoch": 2.104327208061648, "grad_norm": 0.486328125, "learning_rate": 0.00018427961889965012, "loss": 0.8414, "step": 17750 }, { "contrastive_loss": 3.95703125, "epoch": 2.104327208061648, "mse_loss": 0.055552806705236435, "step": 17750 }, { "epoch": 2.105512744516894, "grad_norm": 0.458984375, "learning_rate": 0.00018425736290608692, "loss": 0.8493, "step": 17760 }, { "contrastive_loss": 3.8427734375, "epoch": 2.105512744516894, "mse_loss": 0.08072994649410248, "step": 17760 }, { "epoch": 2.10669828097214, "grad_norm": 0.470703125, "learning_rate": 0.00018423509251524483, "loss": 0.8406, "step": 17770 }, { "contrastive_loss": 3.8802490234375, "epoch": 2.10669828097214, "mse_loss": 0.054184239357709885, "step": 17770 }, { "epoch": 2.107883817427386, "grad_norm": 0.6328125, "learning_rate": 0.00018421280773092927, "loss": 0.8549, "step": 17780 }, { "contrastive_loss": 3.8221435546875, "epoch": 2.107883817427386, "mse_loss": 0.0734713226556778, "step": 17780 }, { "epoch": 2.109069353882632, "grad_norm": 0.58203125, "learning_rate": 0.0001841905085569481, "loss": 0.8409, "step": 17790 }, { "contrastive_loss": 3.797607421875, "epoch": 2.109069353882632, "mse_loss": 0.06818141788244247, "step": 17790 }, { "epoch": 2.110254890337878, "grad_norm": 0.5, "learning_rate": 0.00018416819499711165, "loss": 0.8387, "step": 17800 }, { "contrastive_loss": 3.916748046875, "epoch": 2.110254890337878, "mse_loss": 0.0662008598446846, "step": 17800 }, { "epoch": 2.111440426793124, "grad_norm": 0.3984375, "learning_rate": 0.00018414586705523266, "loss": 0.8479, "step": 17810 }, { "contrastive_loss": 3.8612060546875, "epoch": 2.111440426793124, "mse_loss": 0.0774669274687767, "step": 17810 }, { "epoch": 2.11262596324837, "grad_norm": 0.5078125, "learning_rate": 0.00018412352473512638, "loss": 0.8388, "step": 17820 }, { "contrastive_loss": 3.9012451171875, "epoch": 2.11262596324837, "mse_loss": 0.06083710119128227, "step": 17820 }, { "epoch": 2.113811499703616, "grad_norm": 0.4921875, "learning_rate": 0.0001841011680406105, "loss": 0.8456, "step": 17830 }, { "contrastive_loss": 3.8065185546875, "epoch": 2.113811499703616, "mse_loss": 0.06763824075460434, "step": 17830 }, { "epoch": 2.114997036158862, "grad_norm": 0.55859375, "learning_rate": 0.00018407879697550518, "loss": 0.8522, "step": 17840 }, { "contrastive_loss": 3.9522705078125, "epoch": 2.114997036158862, "mse_loss": 0.047016970813274384, "step": 17840 }, { "epoch": 2.116182572614108, "grad_norm": 0.458984375, "learning_rate": 0.00018405641154363304, "loss": 0.8482, "step": 17850 }, { "contrastive_loss": 3.865234375, "epoch": 2.116182572614108, "mse_loss": 0.07702236622571945, "step": 17850 }, { "epoch": 2.117368109069354, "grad_norm": 0.453125, "learning_rate": 0.00018403401174881906, "loss": 0.8354, "step": 17860 }, { "contrastive_loss": 3.9132080078125, "epoch": 2.117368109069354, "mse_loss": 0.06362660229206085, "step": 17860 }, { "epoch": 2.1185536455246, "grad_norm": 0.51953125, "learning_rate": 0.00018401159759489087, "loss": 0.8378, "step": 17870 }, { "contrastive_loss": 3.944091796875, "epoch": 2.1185536455246, "mse_loss": 0.06927190721035004, "step": 17870 }, { "epoch": 2.119739181979846, "grad_norm": 0.490234375, "learning_rate": 0.00018398916908567836, "loss": 0.8474, "step": 17880 }, { "contrastive_loss": 3.845947265625, "epoch": 2.119739181979846, "mse_loss": 0.07386680692434311, "step": 17880 }, { "epoch": 2.120924718435092, "grad_norm": 0.416015625, "learning_rate": 0.00018396672622501394, "loss": 0.8397, "step": 17890 }, { "contrastive_loss": 3.9991455078125, "epoch": 2.120924718435092, "mse_loss": 0.06657474488019943, "step": 17890 }, { "epoch": 2.122110254890338, "grad_norm": 0.4921875, "learning_rate": 0.00018394426901673251, "loss": 0.8384, "step": 17900 }, { "contrastive_loss": 3.9945068359375, "epoch": 2.122110254890338, "mse_loss": 0.06964009255170822, "step": 17900 }, { "epoch": 2.123295791345584, "grad_norm": 0.5078125, "learning_rate": 0.0001839217974646714, "loss": 0.8417, "step": 17910 }, { "contrastive_loss": 3.939697265625, "epoch": 2.123295791345584, "mse_loss": 0.06957656890153885, "step": 17910 }, { "epoch": 2.12448132780083, "grad_norm": 0.546875, "learning_rate": 0.00018389931157267034, "loss": 0.8458, "step": 17920 }, { "contrastive_loss": 3.9267578125, "epoch": 2.12448132780083, "mse_loss": 0.09610145539045334, "step": 17920 }, { "epoch": 2.125666864256076, "grad_norm": 0.443359375, "learning_rate": 0.00018387681134457163, "loss": 0.8459, "step": 17930 }, { "contrastive_loss": 3.848388671875, "epoch": 2.125666864256076, "mse_loss": 0.10429532825946808, "step": 17930 }, { "epoch": 2.126852400711322, "grad_norm": 0.416015625, "learning_rate": 0.00018385429678421987, "loss": 0.8432, "step": 17940 }, { "contrastive_loss": 3.8555908203125, "epoch": 2.126852400711322, "mse_loss": 0.062098849564790726, "step": 17940 }, { "epoch": 2.128037937166568, "grad_norm": 0.349609375, "learning_rate": 0.0001838317678954622, "loss": 0.8427, "step": 17950 }, { "contrastive_loss": 3.9593505859375, "epoch": 2.128037937166568, "mse_loss": 0.06470537930727005, "step": 17950 }, { "epoch": 2.129223473621814, "grad_norm": 0.359375, "learning_rate": 0.00018380922468214821, "loss": 0.8322, "step": 17960 }, { "contrastive_loss": 3.8623046875, "epoch": 2.129223473621814, "mse_loss": 0.07618939876556396, "step": 17960 }, { "epoch": 2.13040901007706, "grad_norm": 0.51953125, "learning_rate": 0.00018378666714812992, "loss": 0.8434, "step": 17970 }, { "contrastive_loss": 3.943359375, "epoch": 2.13040901007706, "mse_loss": 0.08187726885080338, "step": 17970 }, { "epoch": 2.131594546532306, "grad_norm": 0.4140625, "learning_rate": 0.00018376409529726178, "loss": 0.8444, "step": 17980 }, { "contrastive_loss": 3.9993896484375, "epoch": 2.131594546532306, "mse_loss": 0.05586022511124611, "step": 17980 }, { "epoch": 2.132780082987552, "grad_norm": 0.3984375, "learning_rate": 0.00018374150913340066, "loss": 0.8419, "step": 17990 }, { "contrastive_loss": 3.837646484375, "epoch": 2.132780082987552, "mse_loss": 0.07042376697063446, "step": 17990 }, { "epoch": 2.133965619442798, "grad_norm": 0.421875, "learning_rate": 0.000183718908660406, "loss": 0.8376, "step": 18000 }, { "contrastive_loss": 3.8990478515625, "epoch": 2.133965619442798, "mse_loss": 0.09297336637973785, "step": 18000 }, { "epoch": 2.135151155898044, "grad_norm": 0.5, "learning_rate": 0.0001836962938821396, "loss": 0.8467, "step": 18010 }, { "contrastive_loss": 3.90625, "epoch": 2.135151155898044, "mse_loss": 0.09975927323102951, "step": 18010 }, { "epoch": 2.13633669235329, "grad_norm": 0.38671875, "learning_rate": 0.00018367366480246563, "loss": 0.836, "step": 18020 }, { "contrastive_loss": 3.8594970703125, "epoch": 2.13633669235329, "mse_loss": 0.05960714444518089, "step": 18020 }, { "epoch": 2.137522228808536, "grad_norm": 0.404296875, "learning_rate": 0.00018365102142525082, "loss": 0.8355, "step": 18030 }, { "contrastive_loss": 3.8824462890625, "epoch": 2.137522228808536, "mse_loss": 0.0780029147863388, "step": 18030 }, { "epoch": 2.138707765263782, "grad_norm": 0.490234375, "learning_rate": 0.00018362836375436436, "loss": 0.8398, "step": 18040 }, { "contrastive_loss": 3.7763671875, "epoch": 2.138707765263782, "mse_loss": 0.05631891265511513, "step": 18040 }, { "epoch": 2.139893301719028, "grad_norm": 0.42578125, "learning_rate": 0.00018360569179367775, "loss": 0.8457, "step": 18050 }, { "contrastive_loss": 3.85205078125, "epoch": 2.139893301719028, "mse_loss": 0.06412656605243683, "step": 18050 }, { "epoch": 2.141078838174274, "grad_norm": 0.3671875, "learning_rate": 0.000183583005547065, "loss": 0.8377, "step": 18060 }, { "contrastive_loss": 3.86669921875, "epoch": 2.141078838174274, "mse_loss": 0.07456982135772705, "step": 18060 }, { "epoch": 2.14226437462952, "grad_norm": 0.45703125, "learning_rate": 0.00018356030501840266, "loss": 0.8397, "step": 18070 }, { "contrastive_loss": 3.8997802734375, "epoch": 2.14226437462952, "mse_loss": 0.059875670820474625, "step": 18070 }, { "epoch": 2.143449911084766, "grad_norm": 0.47265625, "learning_rate": 0.00018353759021156953, "loss": 0.8409, "step": 18080 }, { "contrastive_loss": 3.80908203125, "epoch": 2.143449911084766, "mse_loss": 0.08129845559597015, "step": 18080 }, { "epoch": 2.144635447540012, "grad_norm": 0.4140625, "learning_rate": 0.000183514861130447, "loss": 0.836, "step": 18090 }, { "contrastive_loss": 3.891357421875, "epoch": 2.144635447540012, "mse_loss": 0.0834575742483139, "step": 18090 }, { "epoch": 2.145820983995258, "grad_norm": 0.361328125, "learning_rate": 0.00018349211777891883, "loss": 0.8341, "step": 18100 }, { "contrastive_loss": 3.82568359375, "epoch": 2.145820983995258, "mse_loss": 0.06711364537477493, "step": 18100 }, { "epoch": 2.1470065204505038, "grad_norm": 0.5234375, "learning_rate": 0.00018346936016087128, "loss": 0.8356, "step": 18110 }, { "contrastive_loss": 3.825439453125, "epoch": 2.1470065204505038, "mse_loss": 0.05746123194694519, "step": 18110 }, { "epoch": 2.1481920569057498, "grad_norm": 0.478515625, "learning_rate": 0.00018344658828019296, "loss": 0.8426, "step": 18120 }, { "contrastive_loss": 3.9385986328125, "epoch": 2.1481920569057498, "mse_loss": 0.062234070152044296, "step": 18120 }, { "epoch": 2.1493775933609958, "grad_norm": 0.50390625, "learning_rate": 0.00018342380214077494, "loss": 0.8451, "step": 18130 }, { "contrastive_loss": 3.9503173828125, "epoch": 2.1493775933609958, "mse_loss": 0.06952831149101257, "step": 18130 }, { "epoch": 2.1505631298162418, "grad_norm": 0.447265625, "learning_rate": 0.00018340100174651081, "loss": 0.8494, "step": 18140 }, { "contrastive_loss": 3.8602294921875, "epoch": 2.1505631298162418, "mse_loss": 0.07543403655290604, "step": 18140 }, { "epoch": 2.1517486662714878, "grad_norm": 0.474609375, "learning_rate": 0.00018337818710129647, "loss": 0.8364, "step": 18150 }, { "contrastive_loss": 3.871337890625, "epoch": 2.1517486662714878, "mse_loss": 0.0539812371134758, "step": 18150 }, { "epoch": 2.1529342027267337, "grad_norm": 0.38671875, "learning_rate": 0.00018335535820903037, "loss": 0.8397, "step": 18160 }, { "contrastive_loss": 3.9022216796875, "epoch": 2.1529342027267337, "mse_loss": 0.060083527117967606, "step": 18160 }, { "epoch": 2.1541197391819797, "grad_norm": 0.46875, "learning_rate": 0.00018333251507361337, "loss": 0.8421, "step": 18170 }, { "contrastive_loss": 3.767333984375, "epoch": 2.1541197391819797, "mse_loss": 0.05537564307451248, "step": 18170 }, { "epoch": 2.1553052756372257, "grad_norm": 0.435546875, "learning_rate": 0.00018330965769894862, "loss": 0.8385, "step": 18180 }, { "contrastive_loss": 3.880615234375, "epoch": 2.1553052756372257, "mse_loss": 0.05997884273529053, "step": 18180 }, { "epoch": 2.1564908120924717, "grad_norm": 0.41796875, "learning_rate": 0.00018328678608894197, "loss": 0.8441, "step": 18190 }, { "contrastive_loss": 3.984130859375, "epoch": 2.1564908120924717, "mse_loss": 0.04292749613523483, "step": 18190 }, { "epoch": 2.1576763485477177, "grad_norm": 0.416015625, "learning_rate": 0.00018326390024750143, "loss": 0.8381, "step": 18200 }, { "contrastive_loss": 3.929443359375, "epoch": 2.1576763485477177, "mse_loss": 0.06443367153406143, "step": 18200 }, { "epoch": 2.1588618850029637, "grad_norm": 0.44140625, "learning_rate": 0.0001832410001785376, "loss": 0.8522, "step": 18210 }, { "contrastive_loss": 3.908203125, "epoch": 2.1588618850029637, "mse_loss": 0.06107347831130028, "step": 18210 }, { "epoch": 2.1600474214582097, "grad_norm": 0.3828125, "learning_rate": 0.0001832180858859635, "loss": 0.8355, "step": 18220 }, { "contrastive_loss": 4.0135498046875, "epoch": 2.1600474214582097, "mse_loss": 0.06441547721624374, "step": 18220 }, { "epoch": 2.1612329579134557, "grad_norm": 0.470703125, "learning_rate": 0.00018319515737369454, "loss": 0.84, "step": 18230 }, { "contrastive_loss": 3.8441162109375, "epoch": 2.1612329579134557, "mse_loss": 0.05809267982840538, "step": 18230 }, { "epoch": 2.1624184943687017, "grad_norm": 0.4921875, "learning_rate": 0.0001831722146456486, "loss": 0.8398, "step": 18240 }, { "contrastive_loss": 4.0029296875, "epoch": 2.1624184943687017, "mse_loss": 0.08421043306589127, "step": 18240 }, { "epoch": 2.1636040308239477, "grad_norm": 0.484375, "learning_rate": 0.00018314925770574592, "loss": 0.8526, "step": 18250 }, { "contrastive_loss": 3.8873291015625, "epoch": 2.1636040308239477, "mse_loss": 0.058749787509441376, "step": 18250 }, { "epoch": 2.1647895672791937, "grad_norm": 0.41015625, "learning_rate": 0.00018312628655790922, "loss": 0.8402, "step": 18260 }, { "contrastive_loss": 3.94384765625, "epoch": 2.1647895672791937, "mse_loss": 0.07332033663988113, "step": 18260 }, { "epoch": 2.1659751037344397, "grad_norm": 0.67578125, "learning_rate": 0.0001831033012060637, "loss": 0.8378, "step": 18270 }, { "contrastive_loss": 3.9888916015625, "epoch": 2.1659751037344397, "mse_loss": 0.06706882268190384, "step": 18270 }, { "epoch": 2.1671606401896857, "grad_norm": 0.453125, "learning_rate": 0.00018308030165413683, "loss": 0.8418, "step": 18280 }, { "contrastive_loss": 3.792724609375, "epoch": 2.1671606401896857, "mse_loss": 0.07530800998210907, "step": 18280 }, { "epoch": 2.1683461766449317, "grad_norm": 0.55078125, "learning_rate": 0.00018305728790605873, "loss": 0.8518, "step": 18290 }, { "contrastive_loss": 3.91845703125, "epoch": 2.1683461766449317, "mse_loss": 0.05905439332127571, "step": 18290 }, { "epoch": 2.1695317131001777, "grad_norm": 0.423828125, "learning_rate": 0.0001830342599657617, "loss": 0.8477, "step": 18300 }, { "contrastive_loss": 3.8870849609375, "epoch": 2.1695317131001777, "mse_loss": 0.049050699919462204, "step": 18300 }, { "epoch": 2.1707172495554237, "grad_norm": 0.65625, "learning_rate": 0.00018301121783718063, "loss": 0.8417, "step": 18310 }, { "contrastive_loss": 3.7147216796875, "epoch": 2.1707172495554237, "mse_loss": 0.05105841904878616, "step": 18310 }, { "epoch": 2.1719027860106697, "grad_norm": 0.34375, "learning_rate": 0.0001829881615242528, "loss": 0.8304, "step": 18320 }, { "contrastive_loss": 3.8956298828125, "epoch": 2.1719027860106697, "mse_loss": 0.06520669907331467, "step": 18320 }, { "epoch": 2.1730883224659157, "grad_norm": 0.447265625, "learning_rate": 0.00018296509103091788, "loss": 0.8378, "step": 18330 }, { "contrastive_loss": 3.7666015625, "epoch": 2.1730883224659157, "mse_loss": 0.04491815343499184, "step": 18330 }, { "epoch": 2.1742738589211617, "grad_norm": 0.44140625, "learning_rate": 0.00018294200636111802, "loss": 0.8476, "step": 18340 }, { "contrastive_loss": 4.0433349609375, "epoch": 2.1742738589211617, "mse_loss": 0.049188852310180664, "step": 18340 }, { "epoch": 2.1754593953764076, "grad_norm": 0.44140625, "learning_rate": 0.00018291890751879775, "loss": 0.8437, "step": 18350 }, { "contrastive_loss": 3.7913818359375, "epoch": 2.1754593953764076, "mse_loss": 0.05752319097518921, "step": 18350 }, { "epoch": 2.1766449318316536, "grad_norm": 0.466796875, "learning_rate": 0.00018289579450790405, "loss": 0.8323, "step": 18360 }, { "contrastive_loss": 3.8692626953125, "epoch": 2.1766449318316536, "mse_loss": 0.06611399352550507, "step": 18360 }, { "epoch": 2.1778304682868996, "grad_norm": 0.55078125, "learning_rate": 0.0001828726673323862, "loss": 0.854, "step": 18370 }, { "contrastive_loss": 3.856689453125, "epoch": 2.1778304682868996, "mse_loss": 0.0427393801510334, "step": 18370 }, { "epoch": 2.1790160047421456, "grad_norm": 0.50390625, "learning_rate": 0.00018284952599619613, "loss": 0.8407, "step": 18380 }, { "contrastive_loss": 4.021484375, "epoch": 2.1790160047421456, "mse_loss": 0.07783897966146469, "step": 18380 }, { "epoch": 2.1802015411973916, "grad_norm": 0.390625, "learning_rate": 0.000182826370503288, "loss": 0.8461, "step": 18390 }, { "contrastive_loss": 3.884765625, "epoch": 2.1802015411973916, "mse_loss": 0.055183179676532745, "step": 18390 }, { "epoch": 2.1813870776526376, "grad_norm": 0.4765625, "learning_rate": 0.00018280320085761845, "loss": 0.8411, "step": 18400 }, { "contrastive_loss": 3.8609619140625, "epoch": 2.1813870776526376, "mse_loss": 0.08912186324596405, "step": 18400 }, { "epoch": 2.1825726141078836, "grad_norm": 0.466796875, "learning_rate": 0.00018278001706314653, "loss": 0.8472, "step": 18410 }, { "contrastive_loss": 3.973876953125, "epoch": 2.1825726141078836, "mse_loss": 0.056164953857660294, "step": 18410 }, { "epoch": 2.18375815056313, "grad_norm": 0.54296875, "learning_rate": 0.00018275681912383377, "loss": 0.8454, "step": 18420 }, { "contrastive_loss": 3.8466796875, "epoch": 2.18375815056313, "mse_loss": 0.06601303815841675, "step": 18420 }, { "epoch": 2.184943687018376, "grad_norm": 0.4453125, "learning_rate": 0.00018273360704364398, "loss": 0.8376, "step": 18430 }, { "contrastive_loss": 4.039306640625, "epoch": 2.184943687018376, "mse_loss": 0.07220632582902908, "step": 18430 }, { "epoch": 2.186129223473622, "grad_norm": 0.5234375, "learning_rate": 0.00018271038082654355, "loss": 0.8562, "step": 18440 }, { "contrastive_loss": 3.933837890625, "epoch": 2.186129223473622, "mse_loss": 0.09578268229961395, "step": 18440 }, { "epoch": 2.187314759928868, "grad_norm": 0.376953125, "learning_rate": 0.00018268714047650115, "loss": 0.8453, "step": 18450 }, { "contrastive_loss": 3.801025390625, "epoch": 2.187314759928868, "mse_loss": 0.08070135861635208, "step": 18450 }, { "epoch": 2.188500296384114, "grad_norm": 0.474609375, "learning_rate": 0.00018266388599748795, "loss": 0.8478, "step": 18460 }, { "contrastive_loss": 3.817626953125, "epoch": 2.188500296384114, "mse_loss": 0.0638781264424324, "step": 18460 }, { "epoch": 2.18968583283936, "grad_norm": 0.408203125, "learning_rate": 0.00018264061739347751, "loss": 0.8465, "step": 18470 }, { "contrastive_loss": 3.827392578125, "epoch": 2.18968583283936, "mse_loss": 0.05244125798344612, "step": 18470 }, { "epoch": 2.190871369294606, "grad_norm": 0.494140625, "learning_rate": 0.00018261733466844575, "loss": 0.8343, "step": 18480 }, { "contrastive_loss": 3.8118896484375, "epoch": 2.190871369294606, "mse_loss": 0.07160495221614838, "step": 18480 }, { "epoch": 2.192056905749852, "grad_norm": 0.515625, "learning_rate": 0.0001825940378263711, "loss": 0.8514, "step": 18490 }, { "contrastive_loss": 3.9371337890625, "epoch": 2.192056905749852, "mse_loss": 0.06848659366369247, "step": 18490 }, { "epoch": 2.193242442205098, "grad_norm": 0.62890625, "learning_rate": 0.00018257072687123435, "loss": 0.8343, "step": 18500 }, { "contrastive_loss": 3.7337646484375, "epoch": 2.193242442205098, "mse_loss": 0.08076678216457367, "step": 18500 }, { "epoch": 2.194427978660344, "grad_norm": 0.40234375, "learning_rate": 0.00018254740180701867, "loss": 0.836, "step": 18510 }, { "contrastive_loss": 3.8704833984375, "epoch": 2.194427978660344, "mse_loss": 0.06586503237485886, "step": 18510 }, { "epoch": 2.19561351511559, "grad_norm": 0.458984375, "learning_rate": 0.00018252406263770973, "loss": 0.8306, "step": 18520 }, { "contrastive_loss": 3.7977294921875, "epoch": 2.19561351511559, "mse_loss": 0.08101543039083481, "step": 18520 }, { "epoch": 2.196799051570836, "grad_norm": 0.447265625, "learning_rate": 0.0001825007093672955, "loss": 0.8484, "step": 18530 }, { "contrastive_loss": 3.913818359375, "epoch": 2.196799051570836, "mse_loss": 0.07404173165559769, "step": 18530 }, { "epoch": 2.197984588026082, "grad_norm": 0.484375, "learning_rate": 0.00018247734199976643, "loss": 0.8576, "step": 18540 }, { "contrastive_loss": 3.9041748046875, "epoch": 2.197984588026082, "mse_loss": 0.06555580347776413, "step": 18540 }, { "epoch": 2.199170124481328, "grad_norm": 0.490234375, "learning_rate": 0.00018245396053911538, "loss": 0.8501, "step": 18550 }, { "contrastive_loss": 3.81494140625, "epoch": 2.199170124481328, "mse_loss": 0.04773912951350212, "step": 18550 }, { "epoch": 2.200355660936574, "grad_norm": 0.455078125, "learning_rate": 0.0001824305649893376, "loss": 0.8432, "step": 18560 }, { "contrastive_loss": 3.9327392578125, "epoch": 2.200355660936574, "mse_loss": 0.06900446116924286, "step": 18560 }, { "epoch": 2.20154119739182, "grad_norm": 0.44921875, "learning_rate": 0.00018240715535443075, "loss": 0.8419, "step": 18570 }, { "contrastive_loss": 3.9212646484375, "epoch": 2.20154119739182, "mse_loss": 0.0491306446492672, "step": 18570 }, { "epoch": 2.202726733847066, "grad_norm": 0.54296875, "learning_rate": 0.0001823837316383949, "loss": 0.8474, "step": 18580 }, { "contrastive_loss": 3.9744873046875, "epoch": 2.202726733847066, "mse_loss": 0.06063557043671608, "step": 18580 }, { "epoch": 2.203912270302312, "grad_norm": 0.44921875, "learning_rate": 0.00018236029384523247, "loss": 0.848, "step": 18590 }, { "contrastive_loss": 3.86181640625, "epoch": 2.203912270302312, "mse_loss": 0.05657333508133888, "step": 18590 }, { "epoch": 2.205097806757558, "grad_norm": 0.48046875, "learning_rate": 0.00018233684197894843, "loss": 0.8485, "step": 18600 }, { "contrastive_loss": 3.8504638671875, "epoch": 2.205097806757558, "mse_loss": 0.06715957075357437, "step": 18600 }, { "epoch": 2.206283343212804, "grad_norm": 0.482421875, "learning_rate": 0.00018231337604354998, "loss": 0.8333, "step": 18610 }, { "contrastive_loss": 3.9189453125, "epoch": 2.206283343212804, "mse_loss": 0.04418864846229553, "step": 18610 }, { "epoch": 2.20746887966805, "grad_norm": 0.53125, "learning_rate": 0.00018228989604304684, "loss": 0.8322, "step": 18620 }, { "contrastive_loss": 3.779296875, "epoch": 2.20746887966805, "mse_loss": 0.05561656132340431, "step": 18620 }, { "epoch": 2.208654416123296, "grad_norm": 0.41796875, "learning_rate": 0.0001822664019814511, "loss": 0.8393, "step": 18630 }, { "contrastive_loss": 4.0076904296875, "epoch": 2.208654416123296, "mse_loss": 0.0649261549115181, "step": 18630 }, { "epoch": 2.209839952578542, "grad_norm": 0.45703125, "learning_rate": 0.00018224289386277727, "loss": 0.8512, "step": 18640 }, { "contrastive_loss": 3.997314453125, "epoch": 2.209839952578542, "mse_loss": 0.05286794900894165, "step": 18640 }, { "epoch": 2.211025489033788, "grad_norm": 0.498046875, "learning_rate": 0.00018221937169104221, "loss": 0.8454, "step": 18650 }, { "contrastive_loss": 3.876953125, "epoch": 2.211025489033788, "mse_loss": 0.0467308945953846, "step": 18650 }, { "epoch": 2.212211025489034, "grad_norm": 0.416015625, "learning_rate": 0.00018219583547026528, "loss": 0.8487, "step": 18660 }, { "contrastive_loss": 3.9398193359375, "epoch": 2.212211025489034, "mse_loss": 0.06804041564464569, "step": 18660 }, { "epoch": 2.21339656194428, "grad_norm": 0.458984375, "learning_rate": 0.00018217228520446806, "loss": 0.8477, "step": 18670 }, { "contrastive_loss": 3.951416015625, "epoch": 2.21339656194428, "mse_loss": 0.05664430931210518, "step": 18670 }, { "epoch": 2.214582098399526, "grad_norm": 0.47265625, "learning_rate": 0.00018214872089767476, "loss": 0.8476, "step": 18680 }, { "contrastive_loss": 3.96630859375, "epoch": 2.214582098399526, "mse_loss": 0.06862922012805939, "step": 18680 }, { "epoch": 2.215767634854772, "grad_norm": 0.53125, "learning_rate": 0.0001821251425539118, "loss": 0.8474, "step": 18690 }, { "contrastive_loss": 3.96923828125, "epoch": 2.215767634854772, "mse_loss": 0.061233874410390854, "step": 18690 }, { "epoch": 2.216953171310018, "grad_norm": 0.37890625, "learning_rate": 0.00018210155017720812, "loss": 0.8392, "step": 18700 }, { "contrastive_loss": 3.787109375, "epoch": 2.216953171310018, "mse_loss": 0.09715145826339722, "step": 18700 }, { "epoch": 2.218138707765264, "grad_norm": 0.43359375, "learning_rate": 0.00018207794377159503, "loss": 0.8387, "step": 18710 }, { "contrastive_loss": 3.9139404296875, "epoch": 2.218138707765264, "mse_loss": 0.06337049603462219, "step": 18710 }, { "epoch": 2.21932424422051, "grad_norm": 0.39453125, "learning_rate": 0.00018205432334110616, "loss": 0.8425, "step": 18720 }, { "contrastive_loss": 3.8006591796875, "epoch": 2.21932424422051, "mse_loss": 0.0741092637181282, "step": 18720 }, { "epoch": 2.220509780675756, "grad_norm": 0.48046875, "learning_rate": 0.0001820306888897776, "loss": 0.8325, "step": 18730 }, { "contrastive_loss": 3.8646240234375, "epoch": 2.220509780675756, "mse_loss": 0.055068712681531906, "step": 18730 }, { "epoch": 2.221695317131002, "grad_norm": 0.412109375, "learning_rate": 0.00018200704042164786, "loss": 0.8439, "step": 18740 }, { "contrastive_loss": 3.8848876953125, "epoch": 2.221695317131002, "mse_loss": 0.06245087832212448, "step": 18740 }, { "epoch": 2.222880853586248, "grad_norm": 0.51953125, "learning_rate": 0.00018198337794075783, "loss": 0.8449, "step": 18750 }, { "contrastive_loss": 3.7877197265625, "epoch": 2.222880853586248, "mse_loss": 0.0764872282743454, "step": 18750 }, { "epoch": 2.224066390041494, "grad_norm": 0.416015625, "learning_rate": 0.00018195970145115076, "loss": 0.84, "step": 18760 }, { "contrastive_loss": 3.8079833984375, "epoch": 2.224066390041494, "mse_loss": 0.08515436202287674, "step": 18760 }, { "epoch": 2.22525192649674, "grad_norm": 0.404296875, "learning_rate": 0.0001819360109568723, "loss": 0.8393, "step": 18770 }, { "contrastive_loss": 3.9317626953125, "epoch": 2.22525192649674, "mse_loss": 0.05775139853358269, "step": 18770 }, { "epoch": 2.226437462951986, "grad_norm": 0.443359375, "learning_rate": 0.00018191230646197052, "loss": 0.8483, "step": 18780 }, { "contrastive_loss": 3.85107421875, "epoch": 2.226437462951986, "mse_loss": 0.0635792464017868, "step": 18780 }, { "epoch": 2.227622999407232, "grad_norm": 0.546875, "learning_rate": 0.0001818885879704959, "loss": 0.8464, "step": 18790 }, { "contrastive_loss": 3.8922119140625, "epoch": 2.227622999407232, "mse_loss": 0.06317044794559479, "step": 18790 }, { "epoch": 2.228808535862478, "grad_norm": 0.41796875, "learning_rate": 0.00018186485548650122, "loss": 0.844, "step": 18800 }, { "contrastive_loss": 3.8970947265625, "epoch": 2.228808535862478, "mse_loss": 0.07619040459394455, "step": 18800 }, { "epoch": 2.229994072317724, "grad_norm": 0.50390625, "learning_rate": 0.00018184110901404177, "loss": 0.8415, "step": 18810 }, { "contrastive_loss": 3.863037109375, "epoch": 2.229994072317724, "mse_loss": 0.050214555114507675, "step": 18810 }, { "epoch": 2.23117960877297, "grad_norm": 0.45703125, "learning_rate": 0.00018181734855717512, "loss": 0.8482, "step": 18820 }, { "contrastive_loss": 3.77685546875, "epoch": 2.23117960877297, "mse_loss": 0.048874806612730026, "step": 18820 }, { "epoch": 2.232365145228216, "grad_norm": 0.482421875, "learning_rate": 0.00018179357411996131, "loss": 0.8411, "step": 18830 }, { "contrastive_loss": 3.8619384765625, "epoch": 2.232365145228216, "mse_loss": 0.05588744208216667, "step": 18830 }, { "epoch": 2.233550681683462, "grad_norm": 0.4296875, "learning_rate": 0.00018176978570646278, "loss": 0.8441, "step": 18840 }, { "contrastive_loss": 3.8673095703125, "epoch": 2.233550681683462, "mse_loss": 0.07397612184286118, "step": 18840 }, { "epoch": 2.234736218138708, "grad_norm": 0.4453125, "learning_rate": 0.00018174598332074425, "loss": 0.8404, "step": 18850 }, { "contrastive_loss": 3.947021484375, "epoch": 2.234736218138708, "mse_loss": 0.052177634090185165, "step": 18850 }, { "epoch": 2.235921754593954, "grad_norm": 0.400390625, "learning_rate": 0.00018172216696687294, "loss": 0.8425, "step": 18860 }, { "contrastive_loss": 3.840576171875, "epoch": 2.235921754593954, "mse_loss": 0.05461103096604347, "step": 18860 }, { "epoch": 2.2371072910492, "grad_norm": 0.515625, "learning_rate": 0.0001816983366489184, "loss": 0.846, "step": 18870 }, { "contrastive_loss": 3.9185791015625, "epoch": 2.2371072910492, "mse_loss": 0.07412277162075043, "step": 18870 }, { "epoch": 2.238292827504446, "grad_norm": 0.4375, "learning_rate": 0.0001816744923709526, "loss": 0.8394, "step": 18880 }, { "contrastive_loss": 3.8111572265625, "epoch": 2.238292827504446, "mse_loss": 0.05346452444791794, "step": 18880 }, { "epoch": 2.239478363959692, "grad_norm": 0.490234375, "learning_rate": 0.00018165063413704983, "loss": 0.8452, "step": 18890 }, { "contrastive_loss": 3.8468017578125, "epoch": 2.239478363959692, "mse_loss": 0.0621027946472168, "step": 18890 }, { "epoch": 2.240663900414938, "grad_norm": 0.50390625, "learning_rate": 0.00018162676195128684, "loss": 0.8398, "step": 18900 }, { "contrastive_loss": 3.8621826171875, "epoch": 2.240663900414938, "mse_loss": 0.04831495136022568, "step": 18900 }, { "epoch": 2.241849436870184, "grad_norm": 0.40234375, "learning_rate": 0.00018160287581774274, "loss": 0.8425, "step": 18910 }, { "contrastive_loss": 3.9595947265625, "epoch": 2.241849436870184, "mse_loss": 0.06200682371854782, "step": 18910 }, { "epoch": 2.24303497332543, "grad_norm": 0.439453125, "learning_rate": 0.000181578975740499, "loss": 0.8536, "step": 18920 }, { "contrastive_loss": 3.862060546875, "epoch": 2.24303497332543, "mse_loss": 0.0625648945569992, "step": 18920 }, { "epoch": 2.2442205097806758, "grad_norm": 0.419921875, "learning_rate": 0.00018155506172363948, "loss": 0.8318, "step": 18930 }, { "contrastive_loss": 3.8900146484375, "epoch": 2.2442205097806758, "mse_loss": 0.07219014316797256, "step": 18930 }, { "epoch": 2.2454060462359218, "grad_norm": 0.431640625, "learning_rate": 0.00018153113377125047, "loss": 0.8418, "step": 18940 }, { "contrastive_loss": 3.9234619140625, "epoch": 2.2454060462359218, "mse_loss": 0.051413364708423615, "step": 18940 }, { "epoch": 2.2465915826911678, "grad_norm": 0.388671875, "learning_rate": 0.00018150719188742058, "loss": 0.8454, "step": 18950 }, { "contrastive_loss": 3.848876953125, "epoch": 2.2465915826911678, "mse_loss": 0.07234915345907211, "step": 18950 }, { "epoch": 2.2477771191464138, "grad_norm": 0.44140625, "learning_rate": 0.0001814832360762408, "loss": 0.8431, "step": 18960 }, { "contrastive_loss": 3.835205078125, "epoch": 2.2477771191464138, "mse_loss": 0.06458581984043121, "step": 18960 }, { "epoch": 2.2489626556016598, "grad_norm": 0.42578125, "learning_rate": 0.00018145926634180457, "loss": 0.8317, "step": 18970 }, { "contrastive_loss": 3.8544921875, "epoch": 2.2489626556016598, "mse_loss": 0.039848972111940384, "step": 18970 }, { "epoch": 2.2501481920569057, "grad_norm": 0.34375, "learning_rate": 0.00018143528268820764, "loss": 0.8469, "step": 18980 }, { "contrastive_loss": 3.740478515625, "epoch": 2.2501481920569057, "mse_loss": 0.06532178074121475, "step": 18980 }, { "epoch": 2.2513337285121517, "grad_norm": 0.51171875, "learning_rate": 0.00018141128511954814, "loss": 0.8362, "step": 18990 }, { "contrastive_loss": 3.7774658203125, "epoch": 2.2513337285121517, "mse_loss": 0.0719202384352684, "step": 18990 }, { "epoch": 2.2525192649673977, "grad_norm": 0.4140625, "learning_rate": 0.0001813872736399266, "loss": 0.8425, "step": 19000 }, { "contrastive_loss": 3.81201171875, "epoch": 2.2525192649673977, "mse_loss": 0.06363186240196228, "step": 19000 }, { "epoch": 2.2537048014226437, "grad_norm": 0.49609375, "learning_rate": 0.000181363248253446, "loss": 0.8321, "step": 19010 }, { "contrastive_loss": 3.808349609375, "epoch": 2.2537048014226437, "mse_loss": 0.056977298110723495, "step": 19010 }, { "epoch": 2.2548903378778897, "grad_norm": 0.51171875, "learning_rate": 0.00018133920896421153, "loss": 0.8489, "step": 19020 }, { "contrastive_loss": 3.7716064453125, "epoch": 2.2548903378778897, "mse_loss": 0.07441885024309158, "step": 19020 }, { "epoch": 2.2560758743331357, "grad_norm": 0.39453125, "learning_rate": 0.00018131515577633086, "loss": 0.8344, "step": 19030 }, { "contrastive_loss": 3.9229736328125, "epoch": 2.2560758743331357, "mse_loss": 0.07431571930646896, "step": 19030 }, { "epoch": 2.2572614107883817, "grad_norm": 0.455078125, "learning_rate": 0.0001812910886939141, "loss": 0.8394, "step": 19040 }, { "contrastive_loss": 3.90478515625, "epoch": 2.2572614107883817, "mse_loss": 0.05074420943856239, "step": 19040 }, { "epoch": 2.2584469472436277, "grad_norm": 0.4375, "learning_rate": 0.00018126700772107355, "loss": 0.8281, "step": 19050 }, { "contrastive_loss": 3.8206787109375, "epoch": 2.2584469472436277, "mse_loss": 0.0633632019162178, "step": 19050 }, { "epoch": 2.2596324836988737, "grad_norm": 0.46875, "learning_rate": 0.00018124291286192404, "loss": 0.8381, "step": 19060 }, { "contrastive_loss": 3.9293212890625, "epoch": 2.2596324836988737, "mse_loss": 0.052704863250255585, "step": 19060 }, { "epoch": 2.2608180201541197, "grad_norm": 0.41015625, "learning_rate": 0.00018121880412058273, "loss": 0.8341, "step": 19070 }, { "contrastive_loss": 3.8389892578125, "epoch": 2.2608180201541197, "mse_loss": 0.07015088945627213, "step": 19070 }, { "epoch": 2.2620035566093657, "grad_norm": 0.50390625, "learning_rate": 0.00018119468150116914, "loss": 0.8467, "step": 19080 }, { "contrastive_loss": 3.974853515625, "epoch": 2.2620035566093657, "mse_loss": 0.06557641178369522, "step": 19080 }, { "epoch": 2.2631890930646117, "grad_norm": 0.4765625, "learning_rate": 0.00018117054500780514, "loss": 0.8456, "step": 19090 }, { "contrastive_loss": 3.9110107421875, "epoch": 2.2631890930646117, "mse_loss": 0.048466019332408905, "step": 19090 }, { "epoch": 2.2643746295198577, "grad_norm": 0.421875, "learning_rate": 0.00018114639464461503, "loss": 0.8475, "step": 19100 }, { "contrastive_loss": 3.8360595703125, "epoch": 2.2643746295198577, "mse_loss": 0.061357174068689346, "step": 19100 }, { "epoch": 2.2655601659751037, "grad_norm": 0.482421875, "learning_rate": 0.00018112223041572546, "loss": 0.8408, "step": 19110 }, { "contrastive_loss": 3.9854736328125, "epoch": 2.2655601659751037, "mse_loss": 0.06655483692884445, "step": 19110 }, { "epoch": 2.2667457024303497, "grad_norm": 0.39453125, "learning_rate": 0.00018109805232526536, "loss": 0.8552, "step": 19120 }, { "contrastive_loss": 3.9517822265625, "epoch": 2.2667457024303497, "mse_loss": 0.051363442093133926, "step": 19120 }, { "epoch": 2.2679312388855957, "grad_norm": 0.41796875, "learning_rate": 0.0001810738603773662, "loss": 0.839, "step": 19130 }, { "contrastive_loss": 3.9208984375, "epoch": 2.2679312388855957, "mse_loss": 0.06816011667251587, "step": 19130 }, { "epoch": 2.2691167753408417, "grad_norm": 0.51171875, "learning_rate": 0.00018104965457616166, "loss": 0.8328, "step": 19140 }, { "contrastive_loss": 3.9246826171875, "epoch": 2.2691167753408417, "mse_loss": 0.05670473352074623, "step": 19140 }, { "epoch": 2.2703023117960877, "grad_norm": 0.41015625, "learning_rate": 0.00018102543492578782, "loss": 0.846, "step": 19150 }, { "contrastive_loss": 3.8048095703125, "epoch": 2.2703023117960877, "mse_loss": 0.06400714814662933, "step": 19150 }, { "epoch": 2.2714878482513337, "grad_norm": 0.470703125, "learning_rate": 0.00018100120143038325, "loss": 0.8386, "step": 19160 }, { "contrastive_loss": 3.8953857421875, "epoch": 2.2714878482513337, "mse_loss": 0.04981442168354988, "step": 19160 }, { "epoch": 2.2726733847065796, "grad_norm": 0.337890625, "learning_rate": 0.00018097695409408874, "loss": 0.8445, "step": 19170 }, { "contrastive_loss": 3.7935791015625, "epoch": 2.2726733847065796, "mse_loss": 0.07687236368656158, "step": 19170 }, { "epoch": 2.2738589211618256, "grad_norm": 0.4921875, "learning_rate": 0.0001809526929210475, "loss": 0.832, "step": 19180 }, { "contrastive_loss": 3.9140625, "epoch": 2.2738589211618256, "mse_loss": 0.07744600623846054, "step": 19180 }, { "epoch": 2.2750444576170716, "grad_norm": 0.44140625, "learning_rate": 0.00018092841791540512, "loss": 0.8246, "step": 19190 }, { "contrastive_loss": 3.8895263671875, "epoch": 2.2750444576170716, "mse_loss": 0.06688069552183151, "step": 19190 }, { "epoch": 2.2762299940723176, "grad_norm": 0.359375, "learning_rate": 0.00018090412908130946, "loss": 0.828, "step": 19200 }, { "contrastive_loss": 3.9208984375, "epoch": 2.2762299940723176, "mse_loss": 0.06118433550000191, "step": 19200 }, { "epoch": 2.2774155305275636, "grad_norm": 0.41015625, "learning_rate": 0.00018087982642291093, "loss": 0.843, "step": 19210 }, { "contrastive_loss": 3.9066162109375, "epoch": 2.2774155305275636, "mse_loss": 0.05949663370847702, "step": 19210 }, { "epoch": 2.2786010669828096, "grad_norm": 0.66015625, "learning_rate": 0.0001808555099443621, "loss": 0.8557, "step": 19220 }, { "contrastive_loss": 4.0501708984375, "epoch": 2.2786010669828096, "mse_loss": 0.0778544470667839, "step": 19220 }, { "epoch": 2.2797866034380556, "grad_norm": 0.62109375, "learning_rate": 0.00018083117964981803, "loss": 0.8393, "step": 19230 }, { "contrastive_loss": 3.929931640625, "epoch": 2.2797866034380556, "mse_loss": 0.06271110475063324, "step": 19230 }, { "epoch": 2.2809721398933016, "grad_norm": 0.380859375, "learning_rate": 0.0001808068355434361, "loss": 0.8366, "step": 19240 }, { "contrastive_loss": 3.9185791015625, "epoch": 2.2809721398933016, "mse_loss": 0.04993772134184837, "step": 19240 }, { "epoch": 2.2821576763485476, "grad_norm": 0.4375, "learning_rate": 0.00018078247762937604, "loss": 0.8376, "step": 19250 }, { "contrastive_loss": 3.99169921875, "epoch": 2.2821576763485476, "mse_loss": 0.0752902701497078, "step": 19250 }, { "epoch": 2.2833432128037936, "grad_norm": 0.37890625, "learning_rate": 0.00018075810591179997, "loss": 0.8523, "step": 19260 }, { "contrastive_loss": 3.8927001953125, "epoch": 2.2833432128037936, "mse_loss": 0.06970763206481934, "step": 19260 }, { "epoch": 2.2845287492590396, "grad_norm": 0.4921875, "learning_rate": 0.00018073372039487234, "loss": 0.8428, "step": 19270 }, { "contrastive_loss": 3.8131103515625, "epoch": 2.2845287492590396, "mse_loss": 0.06451509147882462, "step": 19270 }, { "epoch": 2.2857142857142856, "grad_norm": 0.458984375, "learning_rate": 0.00018070932108275994, "loss": 0.8479, "step": 19280 }, { "contrastive_loss": 3.8896484375, "epoch": 2.2857142857142856, "mse_loss": 0.09625981748104095, "step": 19280 }, { "epoch": 2.2868998221695316, "grad_norm": 0.439453125, "learning_rate": 0.000180684907979632, "loss": 0.8466, "step": 19290 }, { "contrastive_loss": 3.8284912109375, "epoch": 2.2868998221695316, "mse_loss": 0.07266538590192795, "step": 19290 }, { "epoch": 2.2880853586247776, "grad_norm": 0.51171875, "learning_rate": 0.00018066048108966, "loss": 0.8457, "step": 19300 }, { "contrastive_loss": 3.981689453125, "epoch": 2.2880853586247776, "mse_loss": 0.07990801334381104, "step": 19300 }, { "epoch": 2.2892708950800236, "grad_norm": 0.462890625, "learning_rate": 0.00018063604041701787, "loss": 0.8444, "step": 19310 }, { "contrastive_loss": 3.78466796875, "epoch": 2.2892708950800236, "mse_loss": 0.055992309004068375, "step": 19310 }, { "epoch": 2.2904564315352696, "grad_norm": 0.384765625, "learning_rate": 0.00018061158596588184, "loss": 0.8276, "step": 19320 }, { "contrastive_loss": 3.814697265625, "epoch": 2.2904564315352696, "mse_loss": 0.06851457059383392, "step": 19320 }, { "epoch": 2.2916419679905156, "grad_norm": 0.494140625, "learning_rate": 0.00018058711774043048, "loss": 0.8327, "step": 19330 }, { "contrastive_loss": 3.9476318359375, "epoch": 2.2916419679905156, "mse_loss": 0.052904702723026276, "step": 19330 }, { "epoch": 2.2928275044457616, "grad_norm": 0.478515625, "learning_rate": 0.00018056263574484476, "loss": 0.8413, "step": 19340 }, { "contrastive_loss": 3.9088134765625, "epoch": 2.2928275044457616, "mse_loss": 0.05394964665174484, "step": 19340 }, { "epoch": 2.2940130409010075, "grad_norm": 0.455078125, "learning_rate": 0.00018053813998330798, "loss": 0.8482, "step": 19350 }, { "contrastive_loss": 3.94140625, "epoch": 2.2940130409010075, "mse_loss": 0.06369668990373611, "step": 19350 }, { "epoch": 2.2951985773562535, "grad_norm": 0.451171875, "learning_rate": 0.00018051363046000583, "loss": 0.8399, "step": 19360 }, { "contrastive_loss": 3.8402099609375, "epoch": 2.2951985773562535, "mse_loss": 0.06534446030855179, "step": 19360 }, { "epoch": 2.2963841138114995, "grad_norm": 0.4453125, "learning_rate": 0.0001804891071791263, "loss": 0.8384, "step": 19370 }, { "contrastive_loss": 3.9156494140625, "epoch": 2.2963841138114995, "mse_loss": 0.06939326226711273, "step": 19370 }, { "epoch": 2.2975696502667455, "grad_norm": 0.494140625, "learning_rate": 0.00018046457014485968, "loss": 0.8427, "step": 19380 }, { "contrastive_loss": 3.7301025390625, "epoch": 2.2975696502667455, "mse_loss": 0.04716891795396805, "step": 19380 }, { "epoch": 2.2987551867219915, "grad_norm": 0.453125, "learning_rate": 0.00018044001936139874, "loss": 0.841, "step": 19390 }, { "contrastive_loss": 3.92529296875, "epoch": 2.2987551867219915, "mse_loss": 0.07342253625392914, "step": 19390 }, { "epoch": 2.2999407231772375, "grad_norm": 0.453125, "learning_rate": 0.00018041545483293855, "loss": 0.845, "step": 19400 }, { "contrastive_loss": 4.0242919921875, "epoch": 2.2999407231772375, "mse_loss": 0.051980216056108475, "step": 19400 }, { "epoch": 2.3011262596324835, "grad_norm": 0.380859375, "learning_rate": 0.00018039087656367652, "loss": 0.8508, "step": 19410 }, { "contrastive_loss": 3.8193359375, "epoch": 2.3011262596324835, "mse_loss": 0.06478080153465271, "step": 19410 }, { "epoch": 2.3023117960877295, "grad_norm": 0.578125, "learning_rate": 0.00018036628455781232, "loss": 0.8391, "step": 19420 }, { "contrastive_loss": 3.779541015625, "epoch": 2.3023117960877295, "mse_loss": 0.06544370949268341, "step": 19420 }, { "epoch": 2.3034973325429755, "grad_norm": 0.57421875, "learning_rate": 0.00018034167881954817, "loss": 0.8396, "step": 19430 }, { "contrastive_loss": 3.91943359375, "epoch": 2.3034973325429755, "mse_loss": 0.04553135484457016, "step": 19430 }, { "epoch": 2.3046828689982215, "grad_norm": 0.51953125, "learning_rate": 0.00018031705935308843, "loss": 0.8398, "step": 19440 }, { "contrastive_loss": 3.9476318359375, "epoch": 2.3046828689982215, "mse_loss": 0.06490936875343323, "step": 19440 }, { "epoch": 2.3058684054534675, "grad_norm": 0.443359375, "learning_rate": 0.00018029242616263993, "loss": 0.8434, "step": 19450 }, { "contrastive_loss": 3.9735107421875, "epoch": 2.3058684054534675, "mse_loss": 0.07289520651102066, "step": 19450 }, { "epoch": 2.3070539419087135, "grad_norm": 0.474609375, "learning_rate": 0.0001802677792524118, "loss": 0.8295, "step": 19460 }, { "contrastive_loss": 3.9837646484375, "epoch": 2.3070539419087135, "mse_loss": 0.06603504717350006, "step": 19460 }, { "epoch": 2.3082394783639595, "grad_norm": 0.404296875, "learning_rate": 0.00018024311862661554, "loss": 0.8425, "step": 19470 }, { "contrastive_loss": 3.863525390625, "epoch": 2.3082394783639595, "mse_loss": 0.058146338909864426, "step": 19470 }, { "epoch": 2.3094250148192055, "grad_norm": 0.453125, "learning_rate": 0.00018021844428946492, "loss": 0.8455, "step": 19480 }, { "contrastive_loss": 3.8218994140625, "epoch": 2.3094250148192055, "mse_loss": 0.08655042201280594, "step": 19480 }, { "epoch": 2.3106105512744515, "grad_norm": 0.5546875, "learning_rate": 0.00018019375624517617, "loss": 0.8439, "step": 19490 }, { "contrastive_loss": 3.879638671875, "epoch": 2.3106105512744515, "mse_loss": 0.051036287099123, "step": 19490 }, { "epoch": 2.3117960877296975, "grad_norm": 0.455078125, "learning_rate": 0.0001801690544979678, "loss": 0.8421, "step": 19500 }, { "contrastive_loss": 3.867431640625, "epoch": 2.3117960877296975, "mse_loss": 0.06128227710723877, "step": 19500 }, { "epoch": 2.3129816241849435, "grad_norm": 0.490234375, "learning_rate": 0.00018014433905206063, "loss": 0.8471, "step": 19510 }, { "contrastive_loss": 3.8223876953125, "epoch": 2.3129816241849435, "mse_loss": 0.04475383087992668, "step": 19510 }, { "epoch": 2.3141671606401895, "grad_norm": 0.5, "learning_rate": 0.00018011960991167787, "loss": 0.8402, "step": 19520 }, { "contrastive_loss": 3.8433837890625, "epoch": 2.3141671606401895, "mse_loss": 0.07670053094625473, "step": 19520 }, { "epoch": 2.3153526970954355, "grad_norm": 0.419921875, "learning_rate": 0.00018009486708104504, "loss": 0.8423, "step": 19530 }, { "contrastive_loss": 3.812255859375, "epoch": 2.3153526970954355, "mse_loss": 0.08012441545724869, "step": 19530 }, { "epoch": 2.3165382335506814, "grad_norm": 0.435546875, "learning_rate": 0.00018007011056439006, "loss": 0.8323, "step": 19540 }, { "contrastive_loss": 3.87890625, "epoch": 2.3165382335506814, "mse_loss": 0.05033285170793533, "step": 19540 }, { "epoch": 2.3177237700059274, "grad_norm": 0.44140625, "learning_rate": 0.00018004534036594307, "loss": 0.849, "step": 19550 }, { "contrastive_loss": 3.9195556640625, "epoch": 2.3177237700059274, "mse_loss": 0.0736469030380249, "step": 19550 }, { "epoch": 2.3189093064611734, "grad_norm": 0.427734375, "learning_rate": 0.00018002055648993668, "loss": 0.8424, "step": 19560 }, { "contrastive_loss": 3.964599609375, "epoch": 2.3189093064611734, "mse_loss": 0.06840752810239792, "step": 19560 }, { "epoch": 2.3200948429164194, "grad_norm": 0.4375, "learning_rate": 0.00017999575894060574, "loss": 0.8415, "step": 19570 }, { "contrastive_loss": 3.9630126953125, "epoch": 2.3200948429164194, "mse_loss": 0.06806357949972153, "step": 19570 }, { "epoch": 2.321280379371666, "grad_norm": 0.51171875, "learning_rate": 0.0001799709477221875, "loss": 0.8385, "step": 19580 }, { "contrastive_loss": 3.9588623046875, "epoch": 2.321280379371666, "mse_loss": 0.06802170723676682, "step": 19580 }, { "epoch": 2.322465915826912, "grad_norm": 0.5078125, "learning_rate": 0.00017994612283892146, "loss": 0.8363, "step": 19590 }, { "contrastive_loss": 3.9237060546875, "epoch": 2.322465915826912, "mse_loss": 0.07903827726840973, "step": 19590 }, { "epoch": 2.323651452282158, "grad_norm": 0.404296875, "learning_rate": 0.00017992128429504962, "loss": 0.842, "step": 19600 }, { "contrastive_loss": 3.824951171875, "epoch": 2.323651452282158, "mse_loss": 0.06511061638593674, "step": 19600 }, { "epoch": 2.324836988737404, "grad_norm": 0.466796875, "learning_rate": 0.00017989643209481612, "loss": 0.8245, "step": 19610 }, { "contrastive_loss": 3.829345703125, "epoch": 2.324836988737404, "mse_loss": 0.0456199124455452, "step": 19610 }, { "epoch": 2.32602252519265, "grad_norm": 0.54296875, "learning_rate": 0.00017987156624246753, "loss": 0.8365, "step": 19620 }, { "contrastive_loss": 3.7191162109375, "epoch": 2.32602252519265, "mse_loss": 0.06785713881254196, "step": 19620 }, { "epoch": 2.327208061647896, "grad_norm": 0.375, "learning_rate": 0.00017984668674225277, "loss": 0.8352, "step": 19630 }, { "contrastive_loss": 3.896484375, "epoch": 2.327208061647896, "mse_loss": 0.07245175540447235, "step": 19630 }, { "epoch": 2.328393598103142, "grad_norm": 0.42578125, "learning_rate": 0.00017982179359842307, "loss": 0.8437, "step": 19640 }, { "contrastive_loss": 3.847900390625, "epoch": 2.328393598103142, "mse_loss": 0.051860205829143524, "step": 19640 }, { "epoch": 2.329579134558388, "grad_norm": 0.37890625, "learning_rate": 0.00017979688681523198, "loss": 0.8341, "step": 19650 }, { "contrastive_loss": 3.8533935546875, "epoch": 2.329579134558388, "mse_loss": 0.06190517917275429, "step": 19650 }, { "epoch": 2.330764671013634, "grad_norm": 0.4375, "learning_rate": 0.00017977196639693536, "loss": 0.844, "step": 19660 }, { "contrastive_loss": 3.9208984375, "epoch": 2.330764671013634, "mse_loss": 0.05522335320711136, "step": 19660 }, { "epoch": 2.33195020746888, "grad_norm": 0.431640625, "learning_rate": 0.00017974703234779148, "loss": 0.8307, "step": 19670 }, { "contrastive_loss": 3.7677001953125, "epoch": 2.33195020746888, "mse_loss": 0.054190803319215775, "step": 19670 }, { "epoch": 2.333135743924126, "grad_norm": 0.37890625, "learning_rate": 0.0001797220846720608, "loss": 0.8464, "step": 19680 }, { "contrastive_loss": 3.927978515625, "epoch": 2.333135743924126, "mse_loss": 0.06310997903347015, "step": 19680 }, { "epoch": 2.334321280379372, "grad_norm": 0.404296875, "learning_rate": 0.00017969712337400633, "loss": 0.8388, "step": 19690 }, { "contrastive_loss": 3.833251953125, "epoch": 2.334321280379372, "mse_loss": 0.05135819688439369, "step": 19690 }, { "epoch": 2.335506816834618, "grad_norm": 0.384765625, "learning_rate": 0.00017967214845789317, "loss": 0.8429, "step": 19700 }, { "contrastive_loss": 3.8665771484375, "epoch": 2.335506816834618, "mse_loss": 0.07179118692874908, "step": 19700 }, { "epoch": 2.336692353289864, "grad_norm": 0.365234375, "learning_rate": 0.00017964715992798883, "loss": 0.8492, "step": 19710 }, { "contrastive_loss": 3.8193359375, "epoch": 2.336692353289864, "mse_loss": 0.05719253793358803, "step": 19710 }, { "epoch": 2.33787788974511, "grad_norm": 0.5, "learning_rate": 0.00017962215778856327, "loss": 0.832, "step": 19720 }, { "contrastive_loss": 3.93505859375, "epoch": 2.33787788974511, "mse_loss": 0.04071234539151192, "step": 19720 }, { "epoch": 2.339063426200356, "grad_norm": 0.388671875, "learning_rate": 0.00017959714204388857, "loss": 0.8411, "step": 19730 }, { "contrastive_loss": 3.8311767578125, "epoch": 2.339063426200356, "mse_loss": 0.0645754411816597, "step": 19730 }, { "epoch": 2.340248962655602, "grad_norm": 0.49609375, "learning_rate": 0.00017957211269823935, "loss": 0.8492, "step": 19740 }, { "contrastive_loss": 3.8831787109375, "epoch": 2.340248962655602, "mse_loss": 0.05913568660616875, "step": 19740 }, { "epoch": 2.3414344991108478, "grad_norm": 0.494140625, "learning_rate": 0.0001795470697558923, "loss": 0.8442, "step": 19750 }, { "contrastive_loss": 3.8677978515625, "epoch": 2.3414344991108478, "mse_loss": 0.07910459488630295, "step": 19750 }, { "epoch": 2.3426200355660938, "grad_norm": 0.400390625, "learning_rate": 0.0001795220132211267, "loss": 0.8469, "step": 19760 }, { "contrastive_loss": 3.8848876953125, "epoch": 2.3426200355660938, "mse_loss": 0.0795234814286232, "step": 19760 }, { "epoch": 2.3438055720213398, "grad_norm": 0.470703125, "learning_rate": 0.00017949694309822394, "loss": 0.836, "step": 19770 }, { "contrastive_loss": 3.838623046875, "epoch": 2.3438055720213398, "mse_loss": 0.06955666095018387, "step": 19770 }, { "epoch": 2.3449911084765858, "grad_norm": 0.41796875, "learning_rate": 0.00017947185939146785, "loss": 0.8319, "step": 19780 }, { "contrastive_loss": 3.9083251953125, "epoch": 2.3449911084765858, "mse_loss": 0.0653911754488945, "step": 19780 }, { "epoch": 2.3461766449318318, "grad_norm": 0.65234375, "learning_rate": 0.00017944676210514455, "loss": 0.8351, "step": 19790 }, { "contrastive_loss": 3.8809814453125, "epoch": 2.3461766449318318, "mse_loss": 0.060608964413404465, "step": 19790 }, { "epoch": 2.3473621813870778, "grad_norm": 0.443359375, "learning_rate": 0.0001794216512435425, "loss": 0.8442, "step": 19800 }, { "contrastive_loss": 3.73974609375, "epoch": 2.3473621813870778, "mse_loss": 0.10294930636882782, "step": 19800 }, { "epoch": 2.3485477178423237, "grad_norm": 0.48046875, "learning_rate": 0.0001793965268109524, "loss": 0.8469, "step": 19810 }, { "contrastive_loss": 3.79296875, "epoch": 2.3485477178423237, "mse_loss": 0.048076894134283066, "step": 19810 }, { "epoch": 2.3497332542975697, "grad_norm": 0.404296875, "learning_rate": 0.0001793713888116674, "loss": 0.8376, "step": 19820 }, { "contrastive_loss": 3.884033203125, "epoch": 2.3497332542975697, "mse_loss": 0.06317310035228729, "step": 19820 }, { "epoch": 2.3509187907528157, "grad_norm": 0.3984375, "learning_rate": 0.00017934623724998288, "loss": 0.8359, "step": 19830 }, { "contrastive_loss": 3.9443359375, "epoch": 2.3509187907528157, "mse_loss": 0.06285279989242554, "step": 19830 }, { "epoch": 2.3521043272080617, "grad_norm": 0.37890625, "learning_rate": 0.0001793210721301965, "loss": 0.8369, "step": 19840 }, { "contrastive_loss": 3.904541015625, "epoch": 2.3521043272080617, "mse_loss": 0.05403892323374748, "step": 19840 }, { "epoch": 2.3532898636633077, "grad_norm": 0.609375, "learning_rate": 0.00017929589345660834, "loss": 0.8514, "step": 19850 }, { "contrastive_loss": 3.8580322265625, "epoch": 2.3532898636633077, "mse_loss": 0.0755317285656929, "step": 19850 }, { "epoch": 2.3544754001185537, "grad_norm": 0.349609375, "learning_rate": 0.00017927070123352075, "loss": 0.851, "step": 19860 }, { "contrastive_loss": 3.9322509765625, "epoch": 2.3544754001185537, "mse_loss": 0.0701834186911583, "step": 19860 }, { "epoch": 2.3556609365737997, "grad_norm": 0.49609375, "learning_rate": 0.00017924549546523836, "loss": 0.8452, "step": 19870 }, { "contrastive_loss": 3.9046630859375, "epoch": 2.3556609365737997, "mse_loss": 0.07898092269897461, "step": 19870 }, { "epoch": 2.3568464730290457, "grad_norm": 0.365234375, "learning_rate": 0.00017922027615606818, "loss": 0.8386, "step": 19880 }, { "contrastive_loss": 3.783203125, "epoch": 2.3568464730290457, "mse_loss": 0.060771021991968155, "step": 19880 }, { "epoch": 2.3580320094842917, "grad_norm": 0.470703125, "learning_rate": 0.00017919504331031946, "loss": 0.8388, "step": 19890 }, { "contrastive_loss": 3.7476806640625, "epoch": 2.3580320094842917, "mse_loss": 0.05481315404176712, "step": 19890 }, { "epoch": 2.3592175459395377, "grad_norm": 0.46484375, "learning_rate": 0.00017916979693230386, "loss": 0.8318, "step": 19900 }, { "contrastive_loss": 3.8226318359375, "epoch": 2.3592175459395377, "mse_loss": 0.04856185242533684, "step": 19900 }, { "epoch": 2.3604030823947837, "grad_norm": 0.458984375, "learning_rate": 0.00017914453702633524, "loss": 0.8359, "step": 19910 }, { "contrastive_loss": 3.8292236328125, "epoch": 2.3604030823947837, "mse_loss": 0.06067245453596115, "step": 19910 }, { "epoch": 2.3615886188500297, "grad_norm": 0.5078125, "learning_rate": 0.00017911926359672986, "loss": 0.8331, "step": 19920 }, { "contrastive_loss": 3.8731689453125, "epoch": 2.3615886188500297, "mse_loss": 0.06610902398824692, "step": 19920 }, { "epoch": 2.3627741553052757, "grad_norm": 0.427734375, "learning_rate": 0.00017909397664780624, "loss": 0.8361, "step": 19930 }, { "contrastive_loss": 3.7415771484375, "epoch": 2.3627741553052757, "mse_loss": 0.04400473088026047, "step": 19930 }, { "epoch": 2.3639596917605217, "grad_norm": 0.5078125, "learning_rate": 0.00017906867618388525, "loss": 0.8304, "step": 19940 }, { "contrastive_loss": 3.8839111328125, "epoch": 2.3639596917605217, "mse_loss": 0.05261356756091118, "step": 19940 }, { "epoch": 2.3651452282157677, "grad_norm": 0.484375, "learning_rate": 0.00017904336220929, "loss": 0.8377, "step": 19950 }, { "contrastive_loss": 3.994140625, "epoch": 2.3651452282157677, "mse_loss": 0.052960872650146484, "step": 19950 }, { "epoch": 2.3663307646710137, "grad_norm": 0.419921875, "learning_rate": 0.000179018034728346, "loss": 0.86, "step": 19960 }, { "contrastive_loss": 3.7454833984375, "epoch": 2.3663307646710137, "mse_loss": 0.06797581911087036, "step": 19960 }, { "epoch": 2.3675163011262597, "grad_norm": 0.408203125, "learning_rate": 0.00017899269374538104, "loss": 0.8331, "step": 19970 }, { "contrastive_loss": 3.891357421875, "epoch": 2.3675163011262597, "mse_loss": 0.05645214766263962, "step": 19970 }, { "epoch": 2.3687018375815057, "grad_norm": 0.59765625, "learning_rate": 0.00017896733926472518, "loss": 0.8475, "step": 19980 }, { "contrastive_loss": 3.910400390625, "epoch": 2.3687018375815057, "mse_loss": 0.057815808802843094, "step": 19980 }, { "epoch": 2.3698873740367516, "grad_norm": 0.44140625, "learning_rate": 0.00017894197129071076, "loss": 0.8486, "step": 19990 }, { "contrastive_loss": 3.9840087890625, "epoch": 2.3698873740367516, "mse_loss": 0.04821095988154411, "step": 19990 }, { "epoch": 2.3710729104919976, "grad_norm": 0.5078125, "learning_rate": 0.00017891658982767254, "loss": 0.8433, "step": 20000 } ], "logging_steps": 10, "max_steps": 80000, "num_input_tokens_seen": 0, "num_train_epochs": 10, "save_steps": 20000, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 0.0, "train_batch_size": 32, "trial_name": null, "trial_params": null }