diff --git "a/phase-1-pretraining/logs/train.jsonl" "b/phase-1-pretraining/logs/train.jsonl" new file mode 100644--- /dev/null +++ "b/phase-1-pretraining/logs/train.jsonl" @@ -0,0 +1,1000 @@ +{"step": 0, "loss": 346.7655334472656, "lr": 5.994005994005993e-07, "time_ms": 3103.6784648895264, "eta_seconds": 31036.784648895264, "eta": "8:37:16", "timestamp": 1765119755.5383532} +{"step": 10, "loss": 340.015869140625, "lr": 6.593406593406593e-06, "time_ms": 2678.084135055542, "eta_seconds": 26754.060509204865, "eta": "7:25:54", "timestamp": 1765119782.2909086} +{"step": 20, "loss": 307.205078125, "lr": 1.2587412587412586e-05, "time_ms": 2679.382085800171, "eta_seconds": 26740.233216285706, "eta": "7:25:40", "timestamp": 1765119809.0909734} +{"step": 30, "loss": 219.22137451171875, "lr": 1.858141858141858e-05, "time_ms": 2681.1091899871826, "eta_seconds": 26730.65862417221, "eta": "7:25:30", "timestamp": 1765119835.9003806} +{"step": 40, "loss": 120.50293731689453, "lr": 2.4575424575424573e-05, "time_ms": 2680.757522583008, "eta_seconds": 26700.344924926758, "eta": "7:25:00", "timestamp": 1765119862.7110457} +{"step": 50, "loss": 73.25249481201172, "lr": 3.0569430569430565e-05, "time_ms": 2681.413173675537, "eta_seconds": 26680.061078071594, "eta": "7:24:40", "timestamp": 1765119889.5213668} +{"step": 60, "loss": 58.2353401184082, "lr": 3.656343656343656e-05, "time_ms": 2682.896137237549, "eta_seconds": 26667.987604141235, "eta": "7:24:27", "timestamp": 1765119916.354111} +{"step": 70, "loss": 48.106605529785156, "lr": 4.2557442557442556e-05, "time_ms": 2682.310104370117, "eta_seconds": 26635.339336395264, "eta": "7:23:55", "timestamp": 1765119943.1942616} +{"step": 80, "loss": 42.2056770324707, "lr": 4.855144855144855e-05, "time_ms": 2684.4685077667236, "eta_seconds": 26629.9275970459, "eta": "7:23:49", "timestamp": 1765119970.0385246} +{"step": 90, "loss": 39.07096862792969, "lr": 5.454545454545454e-05, "time_ms": 2684.32879447937, "eta_seconds": 26601.698353290558, "eta": "7:23:21", "timestamp": 1765119996.8823547} +{"step": 100, "loss": 36.518714904785156, "lr": 6.0539460539460535e-05, "time_ms": 2682.6841831207275, "eta_seconds": 26558.573412895203, "eta": "7:22:38", "timestamp": 1765120023.72426} +{"step": 110, "loss": 34.40033721923828, "lr": 6.653346653346653e-05, "time_ms": 2683.2849979400635, "eta_seconds": 26537.688629627228, "eta": "7:22:17", "timestamp": 1765120050.5640945} +{"step": 120, "loss": 33.52009201049805, "lr": 7.252747252747252e-05, "time_ms": 2683.140516281128, "eta_seconds": 26509.428300857544, "eta": "7:21:49", "timestamp": 1765120077.4049942} +{"step": 130, "loss": 31.94071388244629, "lr": 7.852147852147851e-05, "time_ms": 2683.8998794555664, "eta_seconds": 26490.09181022644, "eta": "7:21:30", "timestamp": 1765120104.246763} +{"step": 140, "loss": 31.385366439819336, "lr": 8.451548451548451e-05, "time_ms": 2681.9756031036377, "eta_seconds": 26444.279446601868, "eta": "7:20:44", "timestamp": 1765120131.0864935} +{"step": 150, "loss": 30.354520797729492, "lr": 9.05094905094905e-05, "time_ms": 2683.6555004119873, "eta_seconds": 26434.006679058075, "eta": "7:20:34", "timestamp": 1765120157.9309537} +{"step": 160, "loss": 30.034793853759766, "lr": 9.65034965034965e-05, "time_ms": 2682.577133178711, "eta_seconds": 26396.558990478516, "eta": "7:19:56", "timestamp": 1765120184.7717178} +{"step": 170, "loss": 29.688859939575195, "lr": 0.00010249750249750249, "time_ms": 2683.669090270996, "eta_seconds": 26380.46715736389, "eta": "7:19:40", "timestamp": 1765120211.6135983} +{"step": 180, "loss": 29.22146224975586, "lr": 0.00010849150849150848, "time_ms": 2683.2327842712402, "eta_seconds": 26349.34594154358, "eta": "7:19:09", "timestamp": 1765120238.455056} +{"step": 190, "loss": 28.208110809326172, "lr": 0.00011448551448551448, "time_ms": 2683.6156845092773, "eta_seconds": 26326.26986503601, "eta": "7:18:46", "timestamp": 1765120265.2976305} +{"step": 200, "loss": 28.17795753479004, "lr": 0.00012047952047952047, "time_ms": 2683.290481567383, "eta_seconds": 26296.24671936035, "eta": "7:18:16", "timestamp": 1765120292.1402917} +{"step": 210, "loss": 27.575517654418945, "lr": 0.00012647352647352647, "time_ms": 2684.7128868103027, "eta_seconds": 26283.339161872864, "eta": "7:18:03", "timestamp": 1765120318.986001} +{"step": 220, "loss": 26.767345428466797, "lr": 0.00013246753246753246, "time_ms": 2683.096408843994, "eta_seconds": 26240.682878494263, "eta": "7:17:20", "timestamp": 1765120345.8342094} +{"step": 230, "loss": 26.31460952758789, "lr": 0.00013846153846153847, "time_ms": 2686.1326694488525, "eta_seconds": 26243.51618051529, "eta": "7:17:23", "timestamp": 1765120372.6889124} +{"step": 240, "loss": 25.911911010742188, "lr": 0.00014445554445554444, "time_ms": 2686.924457550049, "eta_seconds": 26224.382705688477, "eta": "7:17:04", "timestamp": 1765120399.548299} +{"step": 250, "loss": 25.004718780517578, "lr": 0.00015044955044955042, "time_ms": 2685.2073669433594, "eta_seconds": 26180.771827697754, "eta": "7:16:20", "timestamp": 1765120426.4025605} +{"step": 260, "loss": 24.249658584594727, "lr": 0.00015644355644355644, "time_ms": 2684.635877609253, "eta_seconds": 26148.353447914124, "eta": "7:15:48", "timestamp": 1765120453.257643} +{"step": 270, "loss": 23.559293746948242, "lr": 0.00016243756243756243, "time_ms": 2686.68270111084, "eta_seconds": 26141.42268180847, "eta": "7:15:41", "timestamp": 1765120480.1153662} +{"step": 280, "loss": 23.364116668701172, "lr": 0.0001684315684315684, "time_ms": 2684.241771697998, "eta_seconds": 26090.83002090454, "eta": "7:14:50", "timestamp": 1765120506.9696681} +{"step": 290, "loss": 22.692651748657227, "lr": 0.0001744255744255744, "time_ms": 2683.720111846924, "eta_seconds": 26058.92228603363, "eta": "7:14:18", "timestamp": 1765120533.8199706} +{"step": 300, "loss": 21.707658767700195, "lr": 0.0001804195804195804, "time_ms": 2684.880018234253, "eta_seconds": 26043.336176872253, "eta": "7:14:03", "timestamp": 1765120560.6726272} +{"step": 310, "loss": 21.29494857788086, "lr": 0.0001864135864135864, "time_ms": 2685.8038902282715, "eta_seconds": 26025.43969631195, "eta": "7:13:45", "timestamp": 1765120587.5225558} +{"step": 320, "loss": 21.047264099121094, "lr": 0.0001924075924075924, "time_ms": 2684.3199729919434, "eta_seconds": 25984.21733856201, "eta": "7:13:04", "timestamp": 1765120614.374398} +{"step": 330, "loss": 20.149551391601562, "lr": 0.00019840159840159836, "time_ms": 2683.290481567383, "eta_seconds": 25947.41895675659, "eta": "7:12:27", "timestamp": 1765120641.2229927} +{"step": 340, "loss": 19.679216384887695, "lr": 0.00020439560439560438, "time_ms": 2684.8385334014893, "eta_seconds": 25935.540232658386, "eta": "7:12:15", "timestamp": 1765120668.0721009} +{"step": 350, "loss": 19.52688980102539, "lr": 0.00021038961038961036, "time_ms": 2684.537410736084, "eta_seconds": 25905.78601360321, "eta": "7:11:45", "timestamp": 1765120694.922882} +{"step": 360, "loss": 18.24361801147461, "lr": 0.00021638361638361638, "time_ms": 2684.95512008667, "eta_seconds": 25882.967357635498, "eta": "7:11:22", "timestamp": 1765120721.7713966} +{"step": 370, "loss": 17.947500228881836, "lr": 0.00022237762237762237, "time_ms": 2684.290885925293, "eta_seconds": 25849.72123146057, "eta": "7:10:49", "timestamp": 1765120748.6251478} +{"step": 380, "loss": 17.02100372314453, "lr": 0.00022837162837162833, "time_ms": 2684.752941131592, "eta_seconds": 25827.323293685913, "eta": "7:10:27", "timestamp": 1765120775.4779832} +{"step": 390, "loss": 16.443405151367188, "lr": 0.00023436563436563435, "time_ms": 2685.9965324401855, "eta_seconds": 25812.426676750183, "eta": "7:10:12", "timestamp": 1765120802.3303127} +{"step": 400, "loss": 15.751742362976074, "lr": 0.00024035964035964033, "time_ms": 2684.3559741973877, "eta_seconds": 25769.817352294922, "eta": "7:09:29", "timestamp": 1765120829.1757474} +{"step": 410, "loss": 15.244556427001953, "lr": 0.0002463536463536463, "time_ms": 2685.481309890747, "eta_seconds": 25753.765761852264, "eta": "7:09:13", "timestamp": 1765120856.0301971} +{"step": 420, "loss": 14.770166397094727, "lr": 0.00025234765234765234, "time_ms": 2684.7314834594727, "eta_seconds": 25719.727611541748, "eta": "7:08:39", "timestamp": 1765120882.8828816} +{"step": 430, "loss": 14.01164436340332, "lr": 0.00025834165834165835, "time_ms": 2685.4372024536133, "eta_seconds": 25699.63402748108, "eta": "7:08:19", "timestamp": 1765120909.7361364} +{"step": 440, "loss": 13.658737182617188, "lr": 0.0002643356643356643, "time_ms": 2685.0922107696533, "eta_seconds": 25669.481534957886, "eta": "7:07:49", "timestamp": 1765120936.5862927} +{"step": 450, "loss": 12.989947319030762, "lr": 0.0002703296703296703, "time_ms": 2684.4775676727295, "eta_seconds": 25636.760771274567, "eta": "7:07:16", "timestamp": 1765120963.4402497} +{"step": 460, "loss": 12.893111228942871, "lr": 0.0002763236763236763, "time_ms": 2684.481143951416, "eta_seconds": 25609.95011329651, "eta": "7:06:49", "timestamp": 1765120990.2906578} +{"step": 470, "loss": 12.253782272338867, "lr": 0.00028231768231768225, "time_ms": 2684.93914604187, "eta_seconds": 25587.470061779022, "eta": "7:06:27", "timestamp": 1765121017.1442094} +{"step": 480, "loss": 11.63758373260498, "lr": 0.00028831168831168827, "time_ms": 2685.370445251465, "eta_seconds": 25564.726638793945, "eta": "7:06:04", "timestamp": 1765121043.996428} +{"step": 490, "loss": 11.170119285583496, "lr": 0.0002943056943056943, "time_ms": 2683.7992668151855, "eta_seconds": 25522.931027412415, "eta": "7:05:22", "timestamp": 1765121070.8503807} +{"step": 500, "loss": 10.74889087677002, "lr": 0.0003002997002997003, "time_ms": 50592.29016304016, "eta_seconds": 480626.75654888153, "eta": "5 days, 13:30:26", "timestamp": 1765121145.6115067} +{"step": 510, "loss": 10.464680671691895, "lr": 0.00030629370629370626, "time_ms": 2684.276342391968, "eta_seconds": 25473.782489299774, "eta": "7:04:33", "timestamp": 1765121172.454694} +{"step": 520, "loss": 10.157018661499023, "lr": 0.0003122877122877123, "time_ms": 2684.4561100006104, "eta_seconds": 25448.643922805786, "eta": "7:04:08", "timestamp": 1765121199.3023608} +{"step": 530, "loss": 9.71251392364502, "lr": 0.0003182817182817183, "time_ms": 2685.8766078948975, "eta_seconds": 25435.25147676468, "eta": "7:03:55", "timestamp": 1765121226.152674} +{"step": 540, "loss": 9.375505447387695, "lr": 0.0003242757242757242, "time_ms": 2684.929847717285, "eta_seconds": 25399.436359405518, "eta": "7:03:19", "timestamp": 1765121253.0055754} +{"step": 550, "loss": 9.244869232177734, "lr": 0.0003302697302697302, "time_ms": 2685.9726905822754, "eta_seconds": 25382.441926002502, "eta": "7:03:02", "timestamp": 1765121279.8631773} +{"step": 560, "loss": 8.83364486694336, "lr": 0.00033626373626373623, "time_ms": 2684.5498085021973, "eta_seconds": 25342.150192260742, "eta": "7:02:22", "timestamp": 1765121306.7228742} +{"step": 570, "loss": 8.691001892089844, "lr": 0.0003422577422577422, "time_ms": 2685.6749057769775, "eta_seconds": 25325.9143614769, "eta": "7:02:05", "timestamp": 1765121333.580086} +{"step": 580, "loss": 8.422346115112305, "lr": 0.0003482517482517482, "time_ms": 2686.0482692718506, "eta_seconds": 25302.574696540833, "eta": "7:01:42", "timestamp": 1765121360.4389098} +{"step": 590, "loss": 8.136713027954102, "lr": 0.0003542457542457542, "time_ms": 2685.2028369903564, "eta_seconds": 25267.758696079254, "eta": "7:01:07", "timestamp": 1765121387.2989519} +{"step": 600, "loss": 7.853506565093994, "lr": 0.00036023976023976024, "time_ms": 2685.605525970459, "eta_seconds": 25244.691944122314, "eta": "7:00:44", "timestamp": 1765121414.1582808} +{"step": 610, "loss": 7.757828235626221, "lr": 0.0003662337662337662, "time_ms": 2685.307741165161, "eta_seconds": 25215.039689540863, "eta": "7:00:15", "timestamp": 1765121441.0180404} +{"step": 620, "loss": 7.671686172485352, "lr": 0.0003722277722277722, "time_ms": 2685.6460571289062, "eta_seconds": 25191.36001586914, "eta": "6:59:51", "timestamp": 1765121467.877593} +{"step": 630, "loss": 7.621791839599609, "lr": 0.00037822177822177823, "time_ms": 2685.410261154175, "eta_seconds": 25162.294147014618, "eta": "6:59:22", "timestamp": 1765121494.7407098} +{"step": 640, "loss": 7.464466571807861, "lr": 0.00038421578421578414, "time_ms": 2685.8890056610107, "eta_seconds": 25139.92109298706, "eta": "6:58:59", "timestamp": 1765121521.6027257} +{"step": 650, "loss": 7.440684795379639, "lr": 0.00039020979020979016, "time_ms": 2685.9965324401855, "eta_seconds": 25114.067578315735, "eta": "6:58:34", "timestamp": 1765121548.4617672} +{"step": 660, "loss": 7.184878349304199, "lr": 0.0003962037962037962, "time_ms": 2686.110258102417, "eta_seconds": 25088.269810676575, "eta": "6:58:08", "timestamp": 1765121575.3242047} +{"step": 670, "loss": 7.3195061683654785, "lr": 0.00040219780219780213, "time_ms": 2685.7752799987793, "eta_seconds": 25058.28336238861, "eta": "6:57:38", "timestamp": 1765121602.1865685} +{"step": 680, "loss": 7.2969584465026855, "lr": 0.00040819180819180815, "time_ms": 2686.6254806518555, "eta_seconds": 25039.349479675293, "eta": "6:57:19", "timestamp": 1765121629.050249} +{"step": 690, "loss": 7.042532920837402, "lr": 0.00041418581418581417, "time_ms": 2686.09619140625, "eta_seconds": 25007.555541992188, "eta": "6:56:47", "timestamp": 1765121655.9154713} +{"step": 700, "loss": 7.124141216278076, "lr": 0.00042017982017982013, "time_ms": 2684.8886013031006, "eta_seconds": 24969.463992118835, "eta": "6:56:09", "timestamp": 1765121682.7800746} +{"step": 710, "loss": 6.965004920959473, "lr": 0.00042617382617382614, "time_ms": 2686.56587600708, "eta_seconds": 24958.196988105774, "eta": "6:55:58", "timestamp": 1765121709.6425798} +{"step": 720, "loss": 7.090205669403076, "lr": 0.00043216783216783216, "time_ms": 2686.3348484039307, "eta_seconds": 24929.187393188477, "eta": "6:55:29", "timestamp": 1765121736.5063298} +{"step": 730, "loss": 7.000826835632324, "lr": 0.0004381618381618381, "time_ms": 2684.6728324890137, "eta_seconds": 24886.917157173157, "eta": "6:54:46", "timestamp": 1765121763.3656955} +{"step": 740, "loss": 6.89832878112793, "lr": 0.0004441558441558441, "time_ms": 2684.767961502075, "eta_seconds": 24860.951323509216, "eta": "6:54:20", "timestamp": 1765121790.2255142} +{"step": 750, "loss": 6.939929962158203, "lr": 0.0004501498501498501, "time_ms": 2685.83083152771, "eta_seconds": 24843.935191631317, "eta": "6:54:03", "timestamp": 1765121817.0816624} +{"step": 760, "loss": 6.83512544631958, "lr": 0.0004561438561438561, "time_ms": 2685.668468475342, "eta_seconds": 24815.57664871216, "eta": "6:53:35", "timestamp": 1765121843.9363298} +{"step": 770, "loss": 6.759770393371582, "lr": 0.0004621378621378621, "time_ms": 2686.134099960327, "eta_seconds": 24793.01774263382, "eta": "6:53:13", "timestamp": 1765121870.7992418} +{"step": 780, "loss": 6.887198448181152, "lr": 0.0004681318681318681, "time_ms": 2686.600685119629, "eta_seconds": 24770.45831680298, "eta": "6:52:50", "timestamp": 1765121897.6636226} +{"step": 790, "loss": 6.741876125335693, "lr": 0.0004741258741258741, "time_ms": 2684.7281455993652, "eta_seconds": 24726.346220970154, "eta": "6:52:06", "timestamp": 1765121924.528988} +{"step": 800, "loss": 6.704683780670166, "lr": 0.00048011988011988007, "time_ms": 2689.269542694092, "eta_seconds": 24741.279792785645, "eta": "6:52:21", "timestamp": 1765121951.400036} +{"step": 810, "loss": 6.5955047607421875, "lr": 0.0004861138861138861, "time_ms": 2685.23907661438, "eta_seconds": 24677.34711408615, "eta": "6:51:17", "timestamp": 1765121978.265252} +{"step": 820, "loss": 6.646420001983643, "lr": 0.0004921078921078921, "time_ms": 2685.8112812042236, "eta_seconds": 24655.747561454773, "eta": "6:50:55", "timestamp": 1765122005.135324} +{"step": 830, "loss": 6.598686218261719, "lr": 0.000498101898101898, "time_ms": 2685.8577728271484, "eta_seconds": 24629.31577682495, "eta": "6:50:29", "timestamp": 1765122032.006535} +{"step": 840, "loss": 6.565834999084473, "lr": 0.000504095904095904, "time_ms": 2685.3716373443604, "eta_seconds": 24598.00419807434, "eta": "6:49:58", "timestamp": 1765122058.8758988} +{"step": 850, "loss": 6.528083801269531, "lr": 0.00051008991008991, "time_ms": 2685.727596282959, "eta_seconds": 24574.407505989075, "eta": "6:49:34", "timestamp": 1765122085.7438421} +{"step": 860, "loss": 6.440849304199219, "lr": 0.000516083916083916, "time_ms": 2687.0501041412354, "eta_seconds": 24559.63795185089, "eta": "6:49:19", "timestamp": 1765122112.612876} +{"step": 870, "loss": 6.455558776855469, "lr": 0.0005220779220779221, "time_ms": 2686.4538192749023, "eta_seconds": 24527.32336997986, "eta": "6:48:47", "timestamp": 1765122139.4836102} +{"step": 880, "loss": 6.385119438171387, "lr": 0.0005280719280719281, "time_ms": 2685.9142780303955, "eta_seconds": 24495.538215637207, "eta": "6:48:15", "timestamp": 1765122166.3486774} +{"step": 890, "loss": 6.395497798919678, "lr": 0.000534065934065934, "time_ms": 2686.5530014038086, "eta_seconds": 24474.497842788696, "eta": "6:47:54", "timestamp": 1765122193.2187178} +{"step": 900, "loss": 6.3999528884887695, "lr": 0.00054005994005994, "time_ms": 2686.0904693603516, "eta_seconds": 24443.4232711792, "eta": "6:47:23", "timestamp": 1765122220.0838802} +{"step": 910, "loss": 6.584550380706787, "lr": 0.000546053946053946, "time_ms": 2687.281608581543, "eta_seconds": 24427.389822006226, "eta": "6:47:07", "timestamp": 1765122246.9554513} +{"step": 920, "loss": 6.415899753570557, "lr": 0.000552047952047952, "time_ms": 2686.6979598999023, "eta_seconds": 24395.217475891113, "eta": "6:46:35", "timestamp": 1765122273.8305373} +{"step": 930, "loss": 6.432614326477051, "lr": 0.0005580419580419581, "time_ms": 2686.631202697754, "eta_seconds": 24367.745008468628, "eta": "6:46:07", "timestamp": 1765122300.7060165} +{"step": 940, "loss": 6.357086658477783, "lr": 0.0005640359640359641, "time_ms": 2687.2456073760986, "eta_seconds": 24346.445202827454, "eta": "6:45:46", "timestamp": 1765122327.5820844} +{"step": 950, "loss": 6.279504299163818, "lr": 0.00057002997002997, "time_ms": 2686.1038208007812, "eta_seconds": 24309.23957824707, "eta": "6:45:09", "timestamp": 1765122354.4642818} +{"step": 960, "loss": 6.364739894866943, "lr": 0.000576023976023976, "time_ms": 2687.244653701782, "eta_seconds": 24292.69166946411, "eta": "6:44:52", "timestamp": 1765122381.3391218} +{"step": 970, "loss": 6.381607532501221, "lr": 0.0005820179820179819, "time_ms": 2688.206672668457, "eta_seconds": 24274.506254196167, "eta": "6:44:34", "timestamp": 1765122408.222101} +{"step": 980, "loss": 6.158621788024902, "lr": 0.0005880119880119879, "time_ms": 2687.0269775390625, "eta_seconds": 24236.983337402344, "eta": "6:43:56", "timestamp": 1765122435.1035419} +{"step": 990, "loss": 6.173436641693115, "lr": 0.0005940059940059939, "time_ms": 2688.02547454834, "eta_seconds": 24219.109525680542, "eta": "6:43:39", "timestamp": 1765122461.982508} +{"step": 1000, "loss": 6.1511664390563965, "lr": 0.0006, "time_ms": 52750.64706802368, "eta_seconds": 474755.82361221313, "eta": "5 days, 11:52:35", "timestamp": 1765122538.9253614} +{"step": 1010, "loss": 6.143887996673584, "lr": 0.0005999983550676034, "time_ms": 2688.1625652313232, "eta_seconds": 24166.581461429596, "eta": "6:42:46", "timestamp": 1765122565.7994134} +{"step": 1020, "loss": 6.213443756103516, "lr": 0.0005999934202904565, "time_ms": 2689.4900798797607, "eta_seconds": 24151.62091732025, "eta": "6:42:31", "timestamp": 1765122592.699499} +{"step": 1030, "loss": 6.061520576477051, "lr": 0.0005999851957286882, "time_ms": 2689.7153854370117, "eta_seconds": 24126.747007369995, "eta": "6:42:06", "timestamp": 1765122619.599735} +{"step": 1040, "loss": 6.144708633422852, "lr": 0.0005999736814825121, "time_ms": 2688.9772415161133, "eta_seconds": 24093.236083984375, "eta": "6:41:33", "timestamp": 1765122646.5007746} +{"step": 1050, "loss": 6.147915840148926, "lr": 0.0005999588776922256, "time_ms": 2690.8462047576904, "eta_seconds": 24083.07353258133, "eta": "6:41:23", "timestamp": 1765122673.4030704} +{"step": 1060, "loss": 6.081887245178223, "lr": 0.0005999407845382082, "time_ms": 2689.561367034912, "eta_seconds": 24044.678621292114, "eta": "6:40:44", "timestamp": 1765122700.3028483} +{"step": 1070, "loss": 5.944100856781006, "lr": 0.0005999194022409194, "time_ms": 2688.474178314209, "eta_seconds": 24008.074412345886, "eta": "6:40:08", "timestamp": 1765122727.2013466} +{"step": 1080, "loss": 5.950677394866943, "lr": 0.0005998947310608956, "time_ms": 2688.8089179992676, "eta_seconds": 23984.175548553467, "eta": "6:39:44", "timestamp": 1765122754.1022463} +{"step": 1090, "loss": 5.9500627517700195, "lr": 0.0005998667712987475, "time_ms": 2689.481258392334, "eta_seconds": 23963.278012275696, "eta": "6:39:23", "timestamp": 1765122780.9994802} +{"step": 1100, "loss": 6.030828475952148, "lr": 0.0005998355232951559, "time_ms": 2689.6204948425293, "eta_seconds": 23937.62240409851, "eta": "6:38:57", "timestamp": 1765122807.900335} +{"step": 1110, "loss": 5.883779048919678, "lr": 0.0005998009874308676, "time_ms": 2691.0197734832764, "eta_seconds": 23923.165786266327, "eta": "6:38:43", "timestamp": 1765122834.8027976} +{"step": 1120, "loss": 5.959603309631348, "lr": 0.0005997631641266917, "time_ms": 2689.3434524536133, "eta_seconds": 23881.369857788086, "eta": "6:38:01", "timestamp": 1765122861.7046688} +{"step": 1130, "loss": 5.959445953369141, "lr": 0.0005997220538434929, "time_ms": 2689.669132232666, "eta_seconds": 23857.365202903748, "eta": "6:37:37", "timestamp": 1765122888.6093028} +{"step": 1140, "loss": 5.868113994598389, "lr": 0.0005996776570821871, "time_ms": 2688.1940364837646, "eta_seconds": 23817.399163246155, "eta": "6:36:57", "timestamp": 1765122915.5074015} +{"step": 1150, "loss": 5.774717807769775, "lr": 0.0005996299743837349, "time_ms": 2690.021753311157, "eta_seconds": 23806.69251680374, "eta": "6:36:46", "timestamp": 1765122942.406164} +{"step": 1160, "loss": 5.775592803955078, "lr": 0.0005995790063291348, "time_ms": 2689.711809158325, "eta_seconds": 23777.052392959595, "eta": "6:36:17", "timestamp": 1765122969.3085918} +{"step": 1170, "loss": 5.86311674118042, "lr": 0.0005995247535394166, "time_ms": 2688.911199569702, "eta_seconds": 23743.08589220047, "eta": "6:35:43", "timestamp": 1765122996.213499} +{"step": 1180, "loss": 5.816684722900391, "lr": 0.0005994672166756333, "time_ms": 2689.279317855835, "eta_seconds": 23719.443583488464, "eta": "6:35:19", "timestamp": 1765123023.1138358} +{"step": 1190, "loss": 5.800718784332275, "lr": 0.0005994063964388535, "time_ms": 2688.938617706299, "eta_seconds": 23689.549221992493, "eta": "6:34:49", "timestamp": 1765123050.0123057} +{"step": 1200, "loss": 5.64614200592041, "lr": 0.0005993422935701524, "time_ms": 2688.7292861938477, "eta_seconds": 23660.81771850586, "eta": "6:34:20", "timestamp": 1765123076.9142306} +{"step": 1210, "loss": 5.775592803955078, "lr": 0.0005992749088506036, "time_ms": 2689.058780670166, "eta_seconds": 23636.82668209076, "eta": "6:33:56", "timestamp": 1765123103.8150866} +{"step": 1220, "loss": 5.688136577606201, "lr": 0.0005992042431012685, "time_ms": 2689.5649433135986, "eta_seconds": 23614.380202293396, "eta": "6:33:34", "timestamp": 1765123130.714806} +{"step": 1230, "loss": 5.592213153839111, "lr": 0.0005991302971831867, "time_ms": 2690.415143966675, "eta_seconds": 23594.940812587738, "eta": "6:33:14", "timestamp": 1765123157.615186} +{"step": 1240, "loss": 5.573948860168457, "lr": 0.0005990530719973661, "time_ms": 2690.1841163635254, "eta_seconds": 23566.012859344482, "eta": "6:32:46", "timestamp": 1765123184.5143056} +{"step": 1250, "loss": 5.54298210144043, "lr": 0.0005989725684847712, "time_ms": 2690.5720233917236, "eta_seconds": 23542.50520467758, "eta": "6:32:22", "timestamp": 1765123211.4161212} +{"step": 1260, "loss": 5.603926181793213, "lr": 0.0005988887876263119, "time_ms": 2688.910484313965, "eta_seconds": 23501.077632904053, "eta": "6:31:41", "timestamp": 1765123238.3158803} +{"step": 1270, "loss": 5.569946765899658, "lr": 0.0005988017304428316, "time_ms": 2689.2940998077393, "eta_seconds": 23477.537491321564, "eta": "6:31:17", "timestamp": 1765123265.2153165} +{"step": 1280, "loss": 5.528009414672852, "lr": 0.0005987113979950944, "time_ms": 2690.838575363159, "eta_seconds": 23464.112377166748, "eta": "6:31:04", "timestamp": 1765123292.1210725} +{"step": 1290, "loss": 5.697690963745117, "lr": 0.0005986177913837728, "time_ms": 2690.0644302368164, "eta_seconds": 23430.46118736267, "eta": "6:30:30", "timestamp": 1765123319.0226107} +{"step": 1300, "loss": 5.562711715698242, "lr": 0.0005985209117494337, "time_ms": 2690.053939819336, "eta_seconds": 23403.469276428223, "eta": "6:30:03", "timestamp": 1765123345.9243383} +{"step": 1310, "loss": 5.477464199066162, "lr": 0.0005984207602725251, "time_ms": 2689.4326210021973, "eta_seconds": 23371.169476509094, "eta": "6:29:31", "timestamp": 1765123372.827006} +{"step": 1320, "loss": 5.5441083908081055, "lr": 0.000598317338173361, "time_ms": 2689.7928714752197, "eta_seconds": 23347.402124404907, "eta": "6:29:07", "timestamp": 1765123399.728433} +{"step": 1330, "loss": 5.481055736541748, "lr": 0.000598210646712107, "time_ms": 2689.0063285827637, "eta_seconds": 23313.68486881256, "eta": "6:28:33", "timestamp": 1765123426.626512} +{"step": 1340, "loss": 5.590710639953613, "lr": 0.0005981006871887649, "time_ms": 2689.6700859069824, "eta_seconds": 23292.542943954468, "eta": "6:28:12", "timestamp": 1765123453.5275724} +{"step": 1350, "loss": 5.507302761077881, "lr": 0.0005979874609431569, "time_ms": 2690.3316974639893, "eta_seconds": 23271.369183063507, "eta": "6:27:51", "timestamp": 1765123480.427398} +{"step": 1360, "loss": 5.357255935668945, "lr": 0.000597870969354909, "time_ms": 2689.1226768493652, "eta_seconds": 23234.019927978516, "eta": "6:27:14", "timestamp": 1765123507.3267548} +{"step": 1370, "loss": 5.371493339538574, "lr": 0.0005977512138434343, "time_ms": 2688.5745525360107, "eta_seconds": 23202.398388385773, "eta": "6:26:42", "timestamp": 1765123534.2281713} +{"step": 1380, "loss": 5.406754970550537, "lr": 0.0005976281958679162, "time_ms": 2690.5357837677, "eta_seconds": 23192.418456077576, "eta": "6:26:32", "timestamp": 1765123561.1328943} +{"step": 1390, "loss": 5.3553972244262695, "lr": 0.0005975019169272897, "time_ms": 2689.5699501037598, "eta_seconds": 23157.19727039337, "eta": "6:25:57", "timestamp": 1765123588.0342567} +{"step": 1400, "loss": 5.363597393035889, "lr": 0.000597372378560224, "time_ms": 2689.809799194336, "eta_seconds": 23132.36427307129, "eta": "6:25:32", "timestamp": 1765123614.9351118} +{"step": 1410, "loss": 5.279834270477295, "lr": 0.000597239582345103, "time_ms": 2690.551996231079, "eta_seconds": 23111.84164762497, "eta": "6:25:11", "timestamp": 1765123641.8347948} +{"step": 1420, "loss": 5.355911731719971, "lr": 0.0005971035299000069, "time_ms": 2690.371036529541, "eta_seconds": 23083.383493423462, "eta": "6:24:43", "timestamp": 1765123668.73617} +{"step": 1430, "loss": 5.340585708618164, "lr": 0.0005969642228826915, "time_ms": 2688.040018081665, "eta_seconds": 23036.50295495987, "eta": "6:23:56", "timestamp": 1765123695.6299567} +{"step": 1440, "loss": 5.435864448547363, "lr": 0.0005968216629905692, "time_ms": 2689.3234252929688, "eta_seconds": 23020.608520507812, "eta": "6:23:40", "timestamp": 1765123722.5254517} +{"step": 1450, "loss": 5.355688095092773, "lr": 0.0005966758519606872, "time_ms": 2689.2354488372803, "eta_seconds": 22992.963087558746, "eta": "6:23:12", "timestamp": 1765123749.4258678} +{"step": 1460, "loss": 5.241639614105225, "lr": 0.0005965267915697067, "time_ms": 2688.742160797119, "eta_seconds": 22961.858053207397, "eta": "6:22:41", "timestamp": 1765123776.3245196} +{"step": 1470, "loss": 5.266523361206055, "lr": 0.0005963744836338816, "time_ms": 2690.6824111938477, "eta_seconds": 22951.52096748352, "eta": "6:22:31", "timestamp": 1765123803.224314} +{"step": 1480, "loss": 5.196133613586426, "lr": 0.0005962189300090363, "time_ms": 2691.359519958496, "eta_seconds": 22930.383110046387, "eta": "6:22:10", "timestamp": 1765123830.1270502} +{"step": 1490, "loss": 5.191649436950684, "lr": 0.0005960601325905423, "time_ms": 2690.066337585449, "eta_seconds": 22892.464532852173, "eta": "6:21:32", "timestamp": 1765123857.0320933} +{"step": 1500, "loss": 5.247959136962891, "lr": 0.0005958980933132962, "time_ms": 52791.23902320862, "eta_seconds": 448725.53169727325, "eta": "5 days, 4:38:45", "timestamp": 1765123934.0361476} +{"step": 1510, "loss": 5.32852029800415, "lr": 0.0005957328141516952, "time_ms": 2689.5833015441895, "eta_seconds": 22834.56223011017, "eta": "6:20:34", "timestamp": 1765123960.9241555} +{"step": 1520, "loss": 5.078707218170166, "lr": 0.0005955642971196142, "time_ms": 2689.277410507202, "eta_seconds": 22805.072441101074, "eta": "6:20:05", "timestamp": 1765123987.8239088} +{"step": 1530, "loss": 5.228704929351807, "lr": 0.0005953925442703796, "time_ms": 2689.476251602173, "eta_seconds": 22779.863851070404, "eta": "6:19:39", "timestamp": 1765124014.7247176} +{"step": 1540, "loss": 5.176631927490234, "lr": 0.000595217557696746, "time_ms": 2690.0246143341064, "eta_seconds": 22757.60823726654, "eta": "6:19:17", "timestamp": 1765124041.6271713} +{"step": 1550, "loss": 5.267725944519043, "lr": 0.0005950393395308692, "time_ms": 2690.298557281494, "eta_seconds": 22733.022809028625, "eta": "6:18:53", "timestamp": 1765124068.5301373} +{"step": 1560, "loss": 5.0185546875, "lr": 0.0005948578919442816, "time_ms": 2690.1421546936035, "eta_seconds": 22704.799785614014, "eta": "6:18:24", "timestamp": 1765124095.4325} +{"step": 1570, "loss": 5.176824569702148, "lr": 0.0005946732171478649, "time_ms": 2689.6560192108154, "eta_seconds": 22673.800241947174, "eta": "6:17:53", "timestamp": 1765124122.3368633} +{"step": 1580, "loss": 5.131961345672607, "lr": 0.0005944853173918229, "time_ms": 2689.350128173828, "eta_seconds": 22644.328079223633, "eta": "6:17:24", "timestamp": 1765124149.2405825} +{"step": 1590, "loss": 5.163421630859375, "lr": 0.0005942941949656549, "time_ms": 2689.868211746216, "eta_seconds": 22621.791660785675, "eta": "6:17:01", "timestamp": 1765124176.143893} +{"step": 1600, "loss": 5.184752464294434, "lr": 0.0005940998521981274, "time_ms": 2689.5687580108643, "eta_seconds": 22592.37756729126, "eta": "6:16:32", "timestamp": 1765124203.0448341} +{"step": 1610, "loss": 5.112778663635254, "lr": 0.0005939022914572459, "time_ms": 2688.4093284606934, "eta_seconds": 22555.754265785217, "eta": "6:15:55", "timestamp": 1765124229.9510524} +{"step": 1620, "loss": 5.1714324951171875, "lr": 0.0005937015151502253, "time_ms": 2690.5524730682373, "eta_seconds": 22546.82972431183, "eta": "6:15:46", "timestamp": 1765124256.8535714} +{"step": 1630, "loss": 4.985273361206055, "lr": 0.0005934975257234617, "time_ms": 2688.6672973632812, "eta_seconds": 22504.145278930664, "eta": "6:15:04", "timestamp": 1765124283.7578146} +{"step": 1640, "loss": 5.042994976043701, "lr": 0.000593290325662502, "time_ms": 2689.197301864624, "eta_seconds": 22481.689443588257, "eta": "6:14:41", "timestamp": 1765124310.6609461} +{"step": 1650, "loss": 4.992228031158447, "lr": 0.0005930799174920135, "time_ms": 2690.4051303863525, "eta_seconds": 22464.882838726044, "eta": "6:14:24", "timestamp": 1765124337.5628526} +{"step": 1660, "loss": 5.010766506195068, "lr": 0.0005928663037757532, "time_ms": 2689.666509628296, "eta_seconds": 22431.818690299988, "eta": "6:13:51", "timestamp": 1765124364.4657145} +{"step": 1670, "loss": 4.953133583068848, "lr": 0.0005926494871165371, "time_ms": 2689.713478088379, "eta_seconds": 22405.313272476196, "eta": "6:13:25", "timestamp": 1765124391.366104} +{"step": 1680, "loss": 4.9790120124816895, "lr": 0.0005924294701562075, "time_ms": 2688.25364112854, "eta_seconds": 22366.270294189453, "eta": "6:12:46", "timestamp": 1765124418.2587678} +{"step": 1690, "loss": 4.86929988861084, "lr": 0.0005922062555756017, "time_ms": 2688.2002353668213, "eta_seconds": 22338.943955898285, "eta": "6:12:18", "timestamp": 1765124445.1397734} +{"step": 1700, "loss": 5.062023639678955, "lr": 0.000591979846094519, "time_ms": 2689.194917678833, "eta_seconds": 22320.317816734314, "eta": "6:12:00", "timestamp": 1765124472.0266626} +{"step": 1710, "loss": 4.921777248382568, "lr": 0.0005917502444716875, "time_ms": 2687.8154277801514, "eta_seconds": 22281.989896297455, "eta": "6:11:21", "timestamp": 1765124498.923863} +{"step": 1720, "loss": 4.832278251647949, "lr": 0.0005915174535047304, "time_ms": 2690.0792121887207, "eta_seconds": 22273.855876922607, "eta": "6:11:13", "timestamp": 1765124525.8243341} +{"step": 1730, "loss": 5.000360488891602, "lr": 0.0005912814760301322, "time_ms": 2689.5461082458496, "eta_seconds": 22242.546315193176, "eta": "6:10:42", "timestamp": 1765124552.7244072} +{"step": 1740, "loss": 4.8151164054870605, "lr": 0.000591042314923204, "time_ms": 2691.019296646118, "eta_seconds": 22227.819390296936, "eta": "6:10:27", "timestamp": 1765124579.6232278} +{"step": 1750, "loss": 4.849522590637207, "lr": 0.0005907999730980484, "time_ms": 2689.249038696289, "eta_seconds": 22186.304569244385, "eta": "6:09:46", "timestamp": 1765124606.5230172} +{"step": 1760, "loss": 4.961391448974609, "lr": 0.000590554453507524, "time_ms": 2689.666986465454, "eta_seconds": 22162.85596847534, "eta": "6:09:22", "timestamp": 1765124633.4262755} +{"step": 1770, "loss": 4.8241400718688965, "lr": 0.0005903057591432097, "time_ms": 2689.9256706237793, "eta_seconds": 22138.088269233704, "eta": "6:08:58", "timestamp": 1765124660.3283496} +{"step": 1780, "loss": 4.888782501220703, "lr": 0.0005900538930353677, "time_ms": 2689.969301223755, "eta_seconds": 22111.547656059265, "eta": "6:08:31", "timestamp": 1765124687.2323804} +{"step": 1790, "loss": 4.8769612312316895, "lr": 0.000589798858252907, "time_ms": 2689.8393630981445, "eta_seconds": 22083.581171035767, "eta": "6:08:03", "timestamp": 1765124714.1317272} +{"step": 1800, "loss": 4.846798419952393, "lr": 0.000589540657903346, "time_ms": 2689.652442932129, "eta_seconds": 22055.150032043457, "eta": "6:07:35", "timestamp": 1765124741.0340238} +{"step": 1810, "loss": 4.916466236114502, "lr": 0.0005892792951327746, "time_ms": 2690.0696754455566, "eta_seconds": 22031.67064189911, "eta": "6:07:11", "timestamp": 1765124767.9360616} +{"step": 1820, "loss": 4.7886247634887695, "lr": 0.0005890147731258154, "time_ms": 2687.9754066467285, "eta_seconds": 21987.63882637024, "eta": "6:06:27", "timestamp": 1765124794.8263743} +{"step": 1830, "loss": 4.800199508666992, "lr": 0.0005887470951055859, "time_ms": 2689.6233558654785, "eta_seconds": 21974.22281742096, "eta": "6:06:14", "timestamp": 1765124821.7199373} +{"step": 1840, "loss": 4.767756462097168, "lr": 0.000588476264333658, "time_ms": 2690.0880336761475, "eta_seconds": 21951.118354797363, "eta": "6:05:51", "timestamp": 1765124848.6208858} +{"step": 1850, "loss": 4.776322841644287, "lr": 0.0005882022841100196, "time_ms": 2688.704490661621, "eta_seconds": 21912.941598892212, "eta": "6:05:12", "timestamp": 1765124875.5212204} +{"step": 1860, "loss": 4.576502799987793, "lr": 0.0005879251577730327, "time_ms": 2689.521074295044, "eta_seconds": 21892.701544761658, "eta": "6:04:52", "timestamp": 1765124902.4222882} +{"step": 1870, "loss": 4.655456066131592, "lr": 0.0005876448886993947, "time_ms": 2688.2739067077637, "eta_seconds": 21855.66686153412, "eta": "6:04:15", "timestamp": 1765124929.319978} +{"step": 1880, "loss": 4.768405914306641, "lr": 0.0005873614803040957, "time_ms": 2689.3739700317383, "eta_seconds": 21837.716636657715, "eta": "6:03:57", "timestamp": 1765124956.2175124} +{"step": 1890, "loss": 4.8236799240112305, "lr": 0.0005870749360403774, "time_ms": 2690.519332885742, "eta_seconds": 21820.11178970337, "eta": "6:03:40", "timestamp": 1765124983.1161835} +{"step": 1900, "loss": 4.86521577835083, "lr": 0.0005867852593996914, "time_ms": 2690.5503273010254, "eta_seconds": 21793.457651138306, "eta": "6:03:13", "timestamp": 1765125010.0160465} +{"step": 1910, "loss": 4.716339588165283, "lr": 0.0005864924539116561, "time_ms": 2688.3695125579834, "eta_seconds": 21748.909356594086, "eta": "6:02:28", "timestamp": 1765125036.915023} +{"step": 1920, "loss": 4.827800750732422, "lr": 0.000586196523144014, "time_ms": 2689.4869804382324, "eta_seconds": 21731.054801940918, "eta": "6:02:11", "timestamp": 1765125063.8155928} +{"step": 1930, "loss": 4.738182544708252, "lr": 0.0005858974707025881, "time_ms": 2691.1165714263916, "eta_seconds": 21717.31073141098, "eta": "6:01:57", "timestamp": 1765125090.718251} +{"step": 1940, "loss": 4.590117454528809, "lr": 0.0005855953002312379, "time_ms": 2689.223289489746, "eta_seconds": 21675.139713287354, "eta": "6:01:15", "timestamp": 1765125117.6225004} +{"step": 1950, "loss": 4.471175193786621, "lr": 0.0005852900154118155, "time_ms": 2690.491199493408, "eta_seconds": 21658.454155921936, "eta": "6:00:58", "timestamp": 1765125144.5258706} +{"step": 1960, "loss": 4.581606388092041, "lr": 0.0005849816199641198, "time_ms": 2690.1652812957764, "eta_seconds": 21628.928861618042, "eta": "6:00:28", "timestamp": 1765125171.4323215} +{"step": 1970, "loss": 4.5900750160217285, "lr": 0.0005846701176458522, "time_ms": 2690.5159950256348, "eta_seconds": 21604.843440055847, "eta": "6:00:04", "timestamp": 1765125198.3371727} +{"step": 1980, "loss": 4.622983455657959, "lr": 0.0005843555122525701, "time_ms": 2690.4196739196777, "eta_seconds": 21577.165784835815, "eta": "5:59:37", "timestamp": 1765125225.2425902} +{"step": 1990, "loss": 4.545095920562744, "lr": 0.0005840378076176409, "time_ms": 2688.927173614502, "eta_seconds": 21538.30666065216, "eta": "5:58:58", "timestamp": 1765125252.1466713} +{"step": 2000, "loss": 4.631114959716797, "lr": 0.0005837170076121953, "time_ms": 52745.16439437866, "eta_seconds": 421961.3151550293, "eta": "4 days, 21:12:41", "timestamp": 1765125329.106254} +{"step": 2010, "loss": 4.499159812927246, "lr": 0.0005833931161450801, "time_ms": 2689.854383468628, "eta_seconds": 21491.936523914337, "eta": "5:58:11", "timestamp": 1765125355.9915245} +{"step": 2020, "loss": 4.651795387268066, "lr": 0.0005830661371628107, "time_ms": 2689.852714538574, "eta_seconds": 21465.024662017822, "eta": "5:57:45", "timestamp": 1765125382.8874786} +{"step": 2030, "loss": 4.451202392578125, "lr": 0.0005827360746495227, "time_ms": 2689.743995666504, "eta_seconds": 21437.259645462036, "eta": "5:57:17", "timestamp": 1765125409.7849338} +{"step": 2040, "loss": 4.467798709869385, "lr": 0.0005824029326269238, "time_ms": 2689.3551349639893, "eta_seconds": 21407.266874313354, "eta": "5:56:47", "timestamp": 1765125436.6876693} +{"step": 2050, "loss": 4.444151878356934, "lr": 0.0005820667151542444, "time_ms": 2688.728094100952, "eta_seconds": 21375.38834810257, "eta": "5:56:15", "timestamp": 1765125463.587287} +{"step": 2060, "loss": 4.495687961578369, "lr": 0.0005817274263281882, "time_ms": 2690.3722286224365, "eta_seconds": 21361.555495262146, "eta": "5:56:01", "timestamp": 1765125490.4922187} +{"step": 2070, "loss": 4.599917888641357, "lr": 0.0005813850702828826, "time_ms": 2690.3960704803467, "eta_seconds": 21334.84083890915, "eta": "5:55:34", "timestamp": 1765125517.3989065} +{"step": 2080, "loss": 4.605347633361816, "lr": 0.0005810396511898279, "time_ms": 2691.009044647217, "eta_seconds": 21312.791633605957, "eta": "5:55:12", "timestamp": 1765125544.3032367} +{"step": 2090, "loss": 4.479176044464111, "lr": 0.0005806911732578466, "time_ms": 2689.573287963867, "eta_seconds": 21274.52470779419, "eta": "5:54:34", "timestamp": 1765125571.2084024} +{"step": 2100, "loss": 4.454916000366211, "lr": 0.0005803396407330325, "time_ms": 2689.7099018096924, "eta_seconds": 21248.70822429657, "eta": "5:54:08", "timestamp": 1765125598.1150725} +{"step": 2110, "loss": 4.535158634185791, "lr": 0.0005799850578986985, "time_ms": 2690.4802322387695, "eta_seconds": 21227.88903236389, "eta": "5:53:47", "timestamp": 1765125625.0211976} +{"step": 2120, "loss": 4.365918159484863, "lr": 0.0005796274290753245, "time_ms": 2690.9713745117188, "eta_seconds": 21204.854431152344, "eta": "5:53:24", "timestamp": 1765125651.9288116} +{"step": 2130, "loss": 4.53456449508667, "lr": 0.0005792667586205048, "time_ms": 2689.976215362549, "eta_seconds": 21170.11281490326, "eta": "5:52:50", "timestamp": 1765125678.835993} +{"step": 2140, "loss": 4.418206214904785, "lr": 0.0005789030509288951, "time_ms": 2690.8910274505615, "eta_seconds": 21150.403475761414, "eta": "5:52:30", "timestamp": 1765125705.745704} +{"step": 2150, "loss": 4.566821575164795, "lr": 0.0005785363104321589, "time_ms": 2690.556526184082, "eta_seconds": 21120.868730545044, "eta": "5:52:00", "timestamp": 1765125732.6561654} +{"step": 2160, "loss": 4.390469551086426, "lr": 0.0005781665415989133, "time_ms": 2690.2236938476562, "eta_seconds": 21091.353759765625, "eta": "5:51:31", "timestamp": 1765125759.5646899} +{"step": 2170, "loss": 4.507580757141113, "lr": 0.0005777937489346749, "time_ms": 2690.2124881744385, "eta_seconds": 21064.363782405853, "eta": "5:51:04", "timestamp": 1765125786.474586} +{"step": 2180, "loss": 4.589878082275391, "lr": 0.0005774179369818046, "time_ms": 2689.869165420532, "eta_seconds": 21034.776873588562, "eta": "5:50:34", "timestamp": 1765125813.3824818} +{"step": 2190, "loss": 4.266302108764648, "lr": 0.0005770391103194527, "time_ms": 2691.129684448242, "eta_seconds": 21017.72283554077, "eta": "5:50:17", "timestamp": 1765125840.2913141} +{"step": 2200, "loss": 4.3395514488220215, "lr": 0.0005766572735635022, "time_ms": 2690.476179122925, "eta_seconds": 20985.714197158813, "eta": "5:49:45", "timestamp": 1765125867.2005522} +{"step": 2210, "loss": 4.426790237426758, "lr": 0.0005762724313665137, "time_ms": 2690.4196739196777, "eta_seconds": 20958.36925983429, "eta": "5:49:18", "timestamp": 1765125894.1072028} +{"step": 2220, "loss": 4.375397682189941, "lr": 0.0005758845884176677, "time_ms": 2687.8440380096436, "eta_seconds": 20911.426615715027, "eta": "5:48:31", "timestamp": 1765125921.0094993} +{"step": 2230, "loss": 4.407618999481201, "lr": 0.0005754937494427085, "time_ms": 2690.1652812957764, "eta_seconds": 20902.584235668182, "eta": "5:48:22", "timestamp": 1765125947.9058745} +{"step": 2240, "loss": 4.4002604484558105, "lr": 0.0005750999192038853, "time_ms": 2689.9304389953613, "eta_seconds": 20873.860206604004, "eta": "5:47:53", "timestamp": 1765125974.8076124} +{"step": 2250, "loss": 4.357213020324707, "lr": 0.0005747031024998955, "time_ms": 2691.0219192504883, "eta_seconds": 20855.419874191284, "eta": "5:47:35", "timestamp": 1765126001.7128844} +{"step": 2260, "loss": 4.385488510131836, "lr": 0.0005743033041658252, "time_ms": 2689.8229122161865, "eta_seconds": 20819.229340553284, "eta": "5:46:59", "timestamp": 1765126028.6218252} +{"step": 2270, "loss": 4.211174011230469, "lr": 0.0005739005290730912, "time_ms": 2690.2060508728027, "eta_seconds": 20795.292773246765, "eta": "5:46:35", "timestamp": 1765126055.5306375} +{"step": 2280, "loss": 4.26361608505249, "lr": 0.0005734947821293807, "time_ms": 2690.3045177459717, "eta_seconds": 20769.1508769989, "eta": "5:46:09", "timestamp": 1765126082.4353797} +{"step": 2290, "loss": 4.374439239501953, "lr": 0.0005730860682785922, "time_ms": 2689.531087875366, "eta_seconds": 20736.284687519073, "eta": "5:45:36", "timestamp": 1765126109.3330204} +{"step": 2300, "loss": 4.300197601318359, "lr": 0.0005726743925007751, "time_ms": 2689.82195854187, "eta_seconds": 20711.6290807724, "eta": "5:45:11", "timestamp": 1765126136.235796} +{"step": 2310, "loss": 4.312472343444824, "lr": 0.0005722597598120686, "time_ms": 2689.9495124816895, "eta_seconds": 20685.711750984192, "eta": "5:44:45", "timestamp": 1765126163.1423688} +{"step": 2320, "loss": 4.192580699920654, "lr": 0.0005718421752646415, "time_ms": 2690.129041671753, "eta_seconds": 20660.191040039062, "eta": "5:44:20", "timestamp": 1765126190.0492797} +{"step": 2330, "loss": 4.325389385223389, "lr": 0.0005714216439466293, "time_ms": 2690.5901432037354, "eta_seconds": 20636.82639837265, "eta": "5:43:56", "timestamp": 1765126216.9522762} +{"step": 2340, "loss": 4.199782371520996, "lr": 0.0005709981709820738, "time_ms": 2691.1561489105225, "eta_seconds": 20614.256100654602, "eta": "5:43:34", "timestamp": 1765126243.858165} +{"step": 2350, "loss": 4.398078441619873, "lr": 0.0005705717615308593, "time_ms": 2690.3462409973145, "eta_seconds": 20581.148743629456, "eta": "5:43:01", "timestamp": 1765126270.7665648} +{"step": 2360, "loss": 4.266849040985107, "lr": 0.0005701424207886503, "time_ms": 2690.908432006836, "eta_seconds": 20558.540420532227, "eta": "5:42:38", "timestamp": 1765126297.6729064} +{"step": 2370, "loss": 4.241163730621338, "lr": 0.0005697101539868282, "time_ms": 2689.2433166503906, "eta_seconds": 20518.92650604248, "eta": "5:41:58", "timestamp": 1765126324.5771458} +{"step": 2380, "loss": 4.255152702331543, "lr": 0.0005692749663924279, "time_ms": 2689.1720294952393, "eta_seconds": 20491.490864753723, "eta": "5:41:31", "timestamp": 1765126351.4782057} +{"step": 2390, "loss": 4.332055568695068, "lr": 0.0005688368633080726, "time_ms": 2690.3936862945557, "eta_seconds": 20473.89595270157, "eta": "5:41:13", "timestamp": 1765126378.3846211} +{"step": 2400, "loss": 4.1553144454956055, "lr": 0.0005683958500719103, "time_ms": 2690.2198791503906, "eta_seconds": 20445.67108154297, "eta": "5:40:45", "timestamp": 1765126405.293487} +{"step": 2410, "loss": 4.2826337814331055, "lr": 0.0005679519320575478, "time_ms": 2690.4358863830566, "eta_seconds": 20420.4083776474, "eta": "5:40:20", "timestamp": 1765126432.2031183} +{"step": 2420, "loss": 4.268885135650635, "lr": 0.0005675051146739864, "time_ms": 2690.762758255005, "eta_seconds": 20395.981707572937, "eta": "5:39:55", "timestamp": 1765126459.1112068} +{"step": 2430, "loss": 4.088177680969238, "lr": 0.0005670554033655546, "time_ms": 2690.8140182495117, "eta_seconds": 20369.462118148804, "eta": "5:39:29", "timestamp": 1765126486.0194724} +{"step": 2440, "loss": 4.099613189697266, "lr": 0.0005666028036118431, "time_ms": 2689.9240016937256, "eta_seconds": 20335.825452804565, "eta": "5:38:55", "timestamp": 1765126512.9303691} +{"step": 2450, "loss": 4.151208400726318, "lr": 0.0005661473209276368, "time_ms": 2689.809560775757, "eta_seconds": 20308.062183856964, "eta": "5:38:28", "timestamp": 1765126539.839847} +{"step": 2460, "loss": 4.239109992980957, "lr": 0.0005656889608628486, "time_ms": 2690.2008056640625, "eta_seconds": 20284.11407470703, "eta": "5:38:04", "timestamp": 1765126566.7486277} +{"step": 2470, "loss": 4.3467254638671875, "lr": 0.0005652277290024511, "time_ms": 2690.450668334961, "eta_seconds": 20259.093532562256, "eta": "5:37:39", "timestamp": 1765126593.6602314} +{"step": 2480, "loss": 4.293366432189941, "lr": 0.0005647636309664091, "time_ms": 2690.796375274658, "eta_seconds": 20234.78874206543, "eta": "5:37:14", "timestamp": 1765126620.5699527} +{"step": 2490, "loss": 4.197343349456787, "lr": 0.0005642966724096107, "time_ms": 2690.587282180786, "eta_seconds": 20206.310489177704, "eta": "5:36:46", "timestamp": 1765126647.4782596} +{"step": 2500, "loss": 4.296971321105957, "lr": 0.0005638268590217985, "time_ms": 52553.4873008728, "eta_seconds": 394151.154756546, "eta": "4 days, 13:29:11", "timestamp": 1765126724.2491896} +{"step": 2510, "loss": 4.135358810424805, "lr": 0.0005633541965275003, "time_ms": 2689.624071121216, "eta_seconds": 20145.284292697906, "eta": "5:35:45", "timestamp": 1765126751.1419098} +{"step": 2520, "loss": 4.316387176513672, "lr": 0.0005628786906859594, "time_ms": 2689.6157264709473, "eta_seconds": 20118.325634002686, "eta": "5:35:18", "timestamp": 1765126778.0439022} +{"step": 2530, "loss": 4.216681003570557, "lr": 0.0005624003472910647, "time_ms": 2689.8193359375, "eta_seconds": 20092.950439453125, "eta": "5:34:52", "timestamp": 1765126804.9449728} +{"step": 2540, "loss": 4.244337558746338, "lr": 0.0005619191721712793, "time_ms": 2690.295696258545, "eta_seconds": 20069.605894088745, "eta": "5:34:29", "timestamp": 1765126831.8450868} +{"step": 2550, "loss": 4.260036945343018, "lr": 0.0005614351711895703, "time_ms": 2689.5980834960938, "eta_seconds": 20037.5057220459, "eta": "5:33:57", "timestamp": 1765126858.7492669} +{"step": 2560, "loss": 4.126336097717285, "lr": 0.0005609483502433367, "time_ms": 2688.1139278411865, "eta_seconds": 19999.567623138428, "eta": "5:33:19", "timestamp": 1765126885.6556203} +{"step": 2570, "loss": 4.224637031555176, "lr": 0.0005604587152643383, "time_ms": 2690.8390522003174, "eta_seconds": 19992.934157848358, "eta": "5:33:12", "timestamp": 1765126912.562684} +{"step": 2580, "loss": 4.080143928527832, "lr": 0.0005599662722186228, "time_ms": 2690.1113986968994, "eta_seconds": 19960.626578330994, "eta": "5:32:40", "timestamp": 1765126939.4688787} +{"step": 2590, "loss": 4.1858744621276855, "lr": 0.0005594710271064532, "time_ms": 2690.446138381958, "eta_seconds": 19936.20588541031, "eta": "5:32:16", "timestamp": 1765126966.372455} +{"step": 2600, "loss": 4.12255334854126, "lr": 0.000558972985962235, "time_ms": 2690.150022506714, "eta_seconds": 19907.110166549683, "eta": "5:31:47", "timestamp": 1765126993.2804158} +{"step": 2610, "loss": 4.162102222442627, "lr": 0.0005584721548544423, "time_ms": 2689.9726390838623, "eta_seconds": 19878.897802829742, "eta": "5:31:18", "timestamp": 1765127020.1878376} +{"step": 2620, "loss": 4.15994930267334, "lr": 0.000557968539885544, "time_ms": 2689.91756439209, "eta_seconds": 19851.591625213623, "eta": "5:30:51", "timestamp": 1765127047.0940373} +{"step": 2630, "loss": 4.2518439292907715, "lr": 0.0005574621471919298, "time_ms": 2689.6262168884277, "eta_seconds": 19822.545218467712, "eta": "5:30:22", "timestamp": 1765127074.0009618} +{"step": 2640, "loss": 4.237005710601807, "lr": 0.0005569529829438347, "time_ms": 2690.3488636016846, "eta_seconds": 19800.9676361084, "eta": "5:30:00", "timestamp": 1765127100.9071944} +{"step": 2650, "loss": 4.076812267303467, "lr": 0.0005564410533452645, "time_ms": 2690.171241760254, "eta_seconds": 19772.758626937866, "eta": "5:29:32", "timestamp": 1765127127.814129} +{"step": 2660, "loss": 4.123446941375732, "lr": 0.0005559263646339196, "time_ms": 2690.8321380615234, "eta_seconds": 19750.707893371582, "eta": "5:29:10", "timestamp": 1765127154.7196994} +{"step": 2670, "loss": 4.2257304191589355, "lr": 0.0005554089230811196, "time_ms": 2690.2596950531006, "eta_seconds": 19719.603564739227, "eta": "5:28:39", "timestamp": 1765127181.6270843} +{"step": 2680, "loss": 4.2654595375061035, "lr": 0.0005548887349917268, "time_ms": 2689.8653507232666, "eta_seconds": 19689.81436729431, "eta": "5:28:09", "timestamp": 1765127208.5337183} +{"step": 2690, "loss": 4.150134563446045, "lr": 0.0005543658067040686, "time_ms": 2690.356492996216, "eta_seconds": 19666.505963802338, "eta": "5:27:46", "timestamp": 1765127235.4411314} +{"step": 2700, "loss": 4.002840995788574, "lr": 0.0005538401445898612, "time_ms": 2689.786672592163, "eta_seconds": 19635.44270992279, "eta": "5:27:15", "timestamp": 1765127262.3470697} +{"step": 2710, "loss": 4.203924655914307, "lr": 0.0005533117550541316, "time_ms": 2690.798759460449, "eta_seconds": 19615.922956466675, "eta": "5:26:55", "timestamp": 1765127289.2560287} +{"step": 2720, "loss": 4.096187114715576, "lr": 0.0005527806445351397, "time_ms": 2690.5291080474854, "eta_seconds": 19587.051906585693, "eta": "5:26:27", "timestamp": 1765127316.1668358} +{"step": 2730, "loss": 4.064530372619629, "lr": 0.0005522468195042993, "time_ms": 2690.0041103363037, "eta_seconds": 19556.329882144928, "eta": "5:25:56", "timestamp": 1765127343.0745533} +{"step": 2740, "loss": 4.076711654663086, "lr": 0.0005517102864661, "time_ms": 2690.5598640441895, "eta_seconds": 19533.464612960815, "eta": "5:25:33", "timestamp": 1765127369.9824014} +{"step": 2750, "loss": 3.985109567642212, "lr": 0.0005511710519580278, "time_ms": 2690.6137466430664, "eta_seconds": 19506.94966316223, "eta": "5:25:06", "timestamp": 1765127396.8902667} +{"step": 2760, "loss": 3.960557699203491, "lr": 0.0005506291225504846, "time_ms": 2691.5478706359863, "eta_seconds": 19486.80658340454, "eta": "5:24:46", "timestamp": 1765127423.8025396} +{"step": 2770, "loss": 4.104734897613525, "lr": 0.0005500845048467095, "time_ms": 2691.075086593628, "eta_seconds": 19456.47287607193, "eta": "5:24:16", "timestamp": 1765127450.7109065} +{"step": 2780, "loss": 4.028797626495361, "lr": 0.0005495372054826974, "time_ms": 2690.6254291534424, "eta_seconds": 19426.315598487854, "eta": "5:23:46", "timestamp": 1765127477.6162007} +{"step": 2790, "loss": 4.151330471038818, "lr": 0.0005489872311271181, "time_ms": 2690.7670497894287, "eta_seconds": 19400.43042898178, "eta": "5:23:20", "timestamp": 1765127504.5236785} +{"step": 2800, "loss": 4.19321870803833, "lr": 0.0005484345884812357, "time_ms": 2689.359426498413, "eta_seconds": 19363.387870788574, "eta": "5:22:43", "timestamp": 1765127531.4266105} +{"step": 2810, "loss": 4.017468452453613, "lr": 0.0005478792842788265, "time_ms": 2689.9585723876953, "eta_seconds": 19340.80213546753, "eta": "5:22:20", "timestamp": 1765127558.3298373} +{"step": 2820, "loss": 4.067428112030029, "lr": 0.0005473213252860967, "time_ms": 2689.1391277313232, "eta_seconds": 19308.0189371109, "eta": "5:21:48", "timestamp": 1765127585.2348807} +{"step": 2830, "loss": 4.087689399719238, "lr": 0.0005467607183016009, "time_ms": 2690.92059135437, "eta_seconds": 19293.900640010834, "eta": "5:21:33", "timestamp": 1765127612.1390598} +{"step": 2840, "loss": 3.9702937602996826, "lr": 0.0005461974701561579, "time_ms": 2690.3679370880127, "eta_seconds": 19263.03442955017, "eta": "5:21:03", "timestamp": 1765127639.0449328} +{"step": 2850, "loss": 3.947720766067505, "lr": 0.000545631587712769, "time_ms": 2689.7547245025635, "eta_seconds": 19231.74628019333, "eta": "5:20:31", "timestamp": 1765127665.9490354} +{"step": 2860, "loss": 4.169245719909668, "lr": 0.0005450630778665329, "time_ms": 2688.1062984466553, "eta_seconds": 19193.07897090912, "eta": "5:19:53", "timestamp": 1765127692.853152} +{"step": 2870, "loss": 3.9979748725891113, "lr": 0.0005444919475445628, "time_ms": 2689.281225204468, "eta_seconds": 19174.575135707855, "eta": "5:19:34", "timestamp": 1765127719.7467926} +{"step": 2880, "loss": 4.091871738433838, "lr": 0.0005439182037059014, "time_ms": 2688.748598098755, "eta_seconds": 19143.890018463135, "eta": "5:19:03", "timestamp": 1765127746.637782} +{"step": 2890, "loss": 4.044551849365234, "lr": 0.0005433418533414364, "time_ms": 2688.985586166382, "eta_seconds": 19118.687517642975, "eta": "5:18:38", "timestamp": 1765127773.5257905} +{"step": 2900, "loss": 4.0237531661987305, "lr": 0.0005427629034738148, "time_ms": 2689.1918182373047, "eta_seconds": 19093.261909484863, "eta": "5:18:13", "timestamp": 1765127800.4230397} +{"step": 2910, "loss": 4.022540092468262, "lr": 0.0005421813611573584, "time_ms": 2689.523458480835, "eta_seconds": 19068.72132062912, "eta": "5:17:48", "timestamp": 1765127827.325521} +{"step": 2920, "loss": 4.0796966552734375, "lr": 0.0005415972334779766, "time_ms": 2689.5859241485596, "eta_seconds": 19042.2683429718, "eta": "5:17:22", "timestamp": 1765127854.2275474} +{"step": 2930, "loss": 4.140377998352051, "lr": 0.0005410105275530809, "time_ms": 2689.663887023926, "eta_seconds": 19015.923681259155, "eta": "5:16:55", "timestamp": 1765127881.1273344} +{"step": 2940, "loss": 4.096635341644287, "lr": 0.000540421250531498, "time_ms": 2688.3959770202637, "eta_seconds": 18980.07559776306, "eta": "5:16:20", "timestamp": 1765127908.0247056} +{"step": 2950, "loss": 4.015339374542236, "lr": 0.000539829409593382, "time_ms": 2689.177989959717, "eta_seconds": 18958.704829216003, "eta": "5:15:58", "timestamp": 1765127934.927474} +{"step": 2960, "loss": 3.9845633506774902, "lr": 0.0005392350119501284, "time_ms": 2689.8226737976074, "eta_seconds": 18936.351623535156, "eta": "5:15:36", "timestamp": 1765127961.829623} +{"step": 2970, "loss": 4.127829551696777, "lr": 0.0005386380648442847, "time_ms": 2690.2408599853516, "eta_seconds": 18912.39324569702, "eta": "5:15:12", "timestamp": 1765127988.7335098} +{"step": 2980, "loss": 4.111495494842529, "lr": 0.000538038575549463, "time_ms": 2689.850330352783, "eta_seconds": 18882.749319076538, "eta": "5:14:42", "timestamp": 1765128015.6368856} +{"step": 2990, "loss": 4.0937700271606445, "lr": 0.0005374365513702513, "time_ms": 2690.776586532593, "eta_seconds": 18862.343871593475, "eta": "5:14:22", "timestamp": 1765128042.543037} +{"step": 3000, "loss": 4.116408348083496, "lr": 0.0005368319996421239, "time_ms": 52531.426191329956, "eta_seconds": 367719.9833393097, "eta": "4 days, 6:08:39", "timestamp": 1765128119.289973} +{"step": 3010, "loss": 3.884317636489868, "lr": 0.0005362249277313534, "time_ms": 2690.204620361328, "eta_seconds": 18804.530296325684, "eta": "5:13:24", "timestamp": 1765128146.178417} +{"step": 3020, "loss": 3.8064355850219727, "lr": 0.0005356153430349189, "time_ms": 2691.070556640625, "eta_seconds": 18783.672485351562, "eta": "5:13:03", "timestamp": 1765128173.0814645} +{"step": 3030, "loss": 4.011989593505859, "lr": 0.0005350032529804177, "time_ms": 2690.1073455810547, "eta_seconds": 18750.04819869995, "eta": "5:12:30", "timestamp": 1765128199.987558} +{"step": 3040, "loss": 4.0624775886535645, "lr": 0.0005343886650259742, "time_ms": 2690.150022506714, "eta_seconds": 18723.44415664673, "eta": "5:12:03", "timestamp": 1765128226.8973207} +{"step": 3050, "loss": 3.912344455718994, "lr": 0.0005337715866601484, "time_ms": 2689.861059188843, "eta_seconds": 18694.534361362457, "eta": "5:11:34", "timestamp": 1765128253.80528} +{"step": 3060, "loss": 3.9372787475585938, "lr": 0.0005331520254018455, "time_ms": 2690.429449081421, "eta_seconds": 18671.58037662506, "eta": "5:11:11", "timestamp": 1765128280.7161987} +{"step": 3070, "loss": 3.936131477355957, "lr": 0.000532529988800224, "time_ms": 2690.486192703247, "eta_seconds": 18645.069315433502, "eta": "5:10:45", "timestamp": 1765128307.6262288} +{"step": 3080, "loss": 4.109328746795654, "lr": 0.0005319054844346036, "time_ms": 2690.4900074005127, "eta_seconds": 18618.190851211548, "eta": "5:10:18", "timestamp": 1765128334.5378642} +{"step": 3090, "loss": 3.9433798789978027, "lr": 0.0005312785199143727, "time_ms": 2691.366672515869, "eta_seconds": 18597.343707084656, "eta": "5:09:57", "timestamp": 1765128361.4491725} +{"step": 3100, "loss": 3.9203379154205322, "lr": 0.0005306491028788964, "time_ms": 2690.842390060425, "eta_seconds": 18566.81249141693, "eta": "5:09:26", "timestamp": 1765128388.359095} +{"step": 3110, "loss": 3.89469051361084, "lr": 0.0005300172409974225, "time_ms": 2690.556526184082, "eta_seconds": 18537.934465408325, "eta": "5:08:57", "timestamp": 1765128415.2691553} +{"step": 3120, "loss": 3.9375972747802734, "lr": 0.0005293829419689886, "time_ms": 2690.3955936431885, "eta_seconds": 18509.921684265137, "eta": "5:08:29", "timestamp": 1765128442.179723} +{"step": 3130, "loss": 4.031548500061035, "lr": 0.0005287462135223283, "time_ms": 2690.8974647521973, "eta_seconds": 18486.465582847595, "eta": "5:08:06", "timestamp": 1765128469.0917287} +{"step": 3140, "loss": 3.8996360301971436, "lr": 0.0005281070634157765, "time_ms": 2690.401554107666, "eta_seconds": 18456.15466117859, "eta": "5:07:36", "timestamp": 1765128496.0038025} +{"step": 3150, "loss": 3.944692850112915, "lr": 0.0005274654994371759, "time_ms": 2691.554069519043, "eta_seconds": 18437.145376205444, "eta": "5:07:17", "timestamp": 1765128522.9183633} +{"step": 3160, "loss": 3.861314296722412, "lr": 0.000526821529403781, "time_ms": 2690.486192703247, "eta_seconds": 18402.92555809021, "eta": "5:06:42", "timestamp": 1765128549.8272362} +{"step": 3170, "loss": 3.936054229736328, "lr": 0.0005261751611621634, "time_ms": 2690.5429363250732, "eta_seconds": 18376.40825510025, "eta": "5:06:16", "timestamp": 1765128576.7379897} +{"step": 3180, "loss": 3.851860761642456, "lr": 0.0005255264025881162, "time_ms": 2690.8438205718994, "eta_seconds": 18351.554856300354, "eta": "5:05:51", "timestamp": 1765128603.6481318} +{"step": 3190, "loss": 4.107852458953857, "lr": 0.0005248752615865577, "time_ms": 2690.609931945801, "eta_seconds": 18323.053636550903, "eta": "5:05:23", "timestamp": 1765128630.55844} +{"step": 3200, "loss": 3.9359970092773438, "lr": 0.0005242217460914358, "time_ms": 2689.9654865264893, "eta_seconds": 18291.765308380127, "eta": "5:04:51", "timestamp": 1765128657.4701886} +{"step": 3210, "loss": 3.8516530990600586, "lr": 0.0005235658640656303, "time_ms": 2691.166877746582, "eta_seconds": 18273.023099899292, "eta": "5:04:33", "timestamp": 1765128684.383935} +{"step": 3220, "loss": 4.065548419952393, "lr": 0.0005229076235008568, "time_ms": 2690.20938873291, "eta_seconds": 18239.61965560913, "eta": "5:03:59", "timestamp": 1765128711.2960458} +{"step": 3230, "loss": 3.8050742149353027, "lr": 0.000522247032417569, "time_ms": 2691.5481090545654, "eta_seconds": 18221.780698299408, "eta": "5:03:41", "timestamp": 1765128738.2080526} +{"step": 3240, "loss": 3.840873956680298, "lr": 0.0005215840988648606, "time_ms": 2690.934658050537, "eta_seconds": 18190.71828842163, "eta": "5:03:10", "timestamp": 1765128765.1179721} +{"step": 3250, "loss": 3.9182777404785156, "lr": 0.0005209188309203678, "time_ms": 2690.6046867370605, "eta_seconds": 18161.58163547516, "eta": "5:02:41", "timestamp": 1765128792.0268388} +{"step": 3260, "loss": 3.9248995780944824, "lr": 0.0005202512366901705, "time_ms": 2690.931558609009, "eta_seconds": 18136.87870502472, "eta": "5:02:16", "timestamp": 1765128818.9371612} +{"step": 3270, "loss": 3.920917272567749, "lr": 0.0005195813243086938, "time_ms": 2690.534830093384, "eta_seconds": 18107.299406528473, "eta": "5:01:47", "timestamp": 1765128845.8472393} +{"step": 3280, "loss": 3.8486971855163574, "lr": 0.0005189091019386086, "time_ms": 2690.969228744507, "eta_seconds": 18083.313217163086, "eta": "5:01:23", "timestamp": 1765128872.7554972} +{"step": 3290, "loss": 3.7571070194244385, "lr": 0.0005182345777707324, "time_ms": 2690.6614303588867, "eta_seconds": 18054.33819770813, "eta": "5:00:54", "timestamp": 1765128899.6661465} +{"step": 3300, "loss": 3.8062729835510254, "lr": 0.0005175577600239292, "time_ms": 2690.9637451171875, "eta_seconds": 18029.457092285156, "eta": "5:00:29", "timestamp": 1765128926.574064} +{"step": 3310, "loss": 3.8404393196105957, "lr": 0.0005168786569450098, "time_ms": 2690.279006958008, "eta_seconds": 17997.966556549072, "eta": "4:59:57", "timestamp": 1765128953.4806604} +{"step": 3320, "loss": 3.783167839050293, "lr": 0.0005161972768086307, "time_ms": 2691.2646293640137, "eta_seconds": 17977.64772415161, "eta": "4:59:37", "timestamp": 1765128980.3903763} +{"step": 3330, "loss": 3.9795150756835938, "lr": 0.0005155136279171941, "time_ms": 2690.1021003723145, "eta_seconds": 17942.981009483337, "eta": "4:59:02", "timestamp": 1765129007.3016863} +{"step": 3340, "loss": 3.8668627738952637, "lr": 0.0005148277186007459, "time_ms": 2690.272331237793, "eta_seconds": 17917.2137260437, "eta": "4:58:37", "timestamp": 1765129034.2122235} +{"step": 3350, "loss": 4.01901912689209, "lr": 0.0005141395572168746, "time_ms": 2690.6771659851074, "eta_seconds": 17893.003153800964, "eta": "4:58:13", "timestamp": 1765129061.1224625} +{"step": 3360, "loss": 3.829000234603882, "lr": 0.0005134491521506094, "time_ms": 2690.5136108398438, "eta_seconds": 17865.010375976562, "eta": "4:57:45", "timestamp": 1765129088.0342066} +{"step": 3370, "loss": 3.866755962371826, "lr": 0.0005127565118143183, "time_ms": 2691.81752204895, "eta_seconds": 17846.75017118454, "eta": "4:57:26", "timestamp": 1765129114.9443855} +{"step": 3380, "loss": 4.0187602043151855, "lr": 0.0005120616446476052, "time_ms": 2691.0533905029297, "eta_seconds": 17814.773445129395, "eta": "4:56:54", "timestamp": 1765129141.8544538} +{"step": 3390, "loss": 3.8270366191864014, "lr": 0.0005113645591172073, "time_ms": 2690.3955936431885, "eta_seconds": 17783.514873981476, "eta": "4:56:23", "timestamp": 1765129168.7613227} +{"step": 3400, "loss": 3.699831008911133, "lr": 0.0005106652637168916, "time_ms": 2690.246105194092, "eta_seconds": 17755.624294281006, "eta": "4:55:55", "timestamp": 1765129195.6692035} +{"step": 3410, "loss": 3.8173210620880127, "lr": 0.000509963766967352, "time_ms": 2689.948320388794, "eta_seconds": 17726.759431362152, "eta": "4:55:26", "timestamp": 1765129222.5758166} +{"step": 3420, "loss": 3.877948522567749, "lr": 0.0005092600774161052, "time_ms": 2690.767288208008, "eta_seconds": 17705.24875640869, "eta": "4:55:05", "timestamp": 1765129249.48574} +{"step": 3430, "loss": 3.9030673503875732, "lr": 0.000508554203637386, "time_ms": 2690.8321380615234, "eta_seconds": 17678.76714706421, "eta": "4:54:38", "timestamp": 1765129276.39221} +{"step": 3440, "loss": 3.750906229019165, "lr": 0.0005078461542320436, "time_ms": 2689.9001598358154, "eta_seconds": 17645.74504852295, "eta": "4:54:05", "timestamp": 1765129303.2987702} +{"step": 3450, "loss": 3.7287631034851074, "lr": 0.0005071359378274369, "time_ms": 2690.302848815918, "eta_seconds": 17621.483659744263, "eta": "4:53:41", "timestamp": 1765129330.204738} +{"step": 3460, "loss": 3.9097394943237305, "lr": 0.0005064235630773285, "time_ms": 2689.9290084838867, "eta_seconds": 17592.13571548462, "eta": "4:53:12", "timestamp": 1765129357.110886} +{"step": 3470, "loss": 3.604060173034668, "lr": 0.0005057090386617796, "time_ms": 2690.5386447906494, "eta_seconds": 17569.21735048294, "eta": "4:52:49", "timestamp": 1765129384.019443} +{"step": 3480, "loss": 3.7080392837524414, "lr": 0.0005049923732870453, "time_ms": 2691.5316581726074, "eta_seconds": 17548.7864112854, "eta": "4:52:28", "timestamp": 1765129410.9314084} +{"step": 3490, "loss": 3.9106361865997314, "lr": 0.0005042735756854666, "time_ms": 2690.3491020202637, "eta_seconds": 17514.172654151917, "eta": "4:51:54", "timestamp": 1765129437.841807} +{"step": 3500, "loss": 3.8377413749694824, "lr": 0.0005035526546153655, "time_ms": 52734.42816734314, "eta_seconds": 342773.7830877304, "eta": "3 days, 23:12:53", "timestamp": 1765129514.792843} +{"step": 3510, "loss": 3.8816070556640625, "lr": 0.000502829618860938, "time_ms": 2686.624050140381, "eta_seconds": 17436.19008541107, "eta": "4:50:36", "timestamp": 1765129541.6629987} +{"step": 3520, "loss": 3.789853096008301, "lr": 0.0005021044772321461, "time_ms": 2688.7776851654053, "eta_seconds": 17423.279399871826, "eta": "4:50:23", "timestamp": 1765129568.5453608} +{"step": 3530, "loss": 3.931692600250244, "lr": 0.0005013772385646122, "time_ms": 2687.7686977386475, "eta_seconds": 17389.86347436905, "eta": "4:49:49", "timestamp": 1765129595.4246185} +{"step": 3540, "loss": 3.920625686645508, "lr": 0.0005006479117195097, "time_ms": 2689.38946723938, "eta_seconds": 17373.455958366394, "eta": "4:49:33", "timestamp": 1765129622.3114967} +{"step": 3550, "loss": 3.8381471633911133, "lr": 0.0004999165055834561, "time_ms": 2687.351703643799, "eta_seconds": 17333.418488502502, "eta": "4:48:53", "timestamp": 1765129649.194024} +{"step": 3560, "loss": 3.7834129333496094, "lr": 0.0004991830290684043, "time_ms": 2687.3648166656494, "eta_seconds": 17306.629419326782, "eta": "4:48:26", "timestamp": 1765129676.0808578} +{"step": 3570, "loss": 3.8798818588256836, "lr": 0.0004984474911115342, "time_ms": 2688.4655952453613, "eta_seconds": 17286.833777427673, "eta": "4:48:06", "timestamp": 1765129702.9649935} +{"step": 3580, "loss": 3.758981943130493, "lr": 0.0004977099006751437, "time_ms": 2688.0064010620117, "eta_seconds": 17257.001094818115, "eta": "4:47:37", "timestamp": 1765129729.8516288} +{"step": 3590, "loss": 3.92991304397583, "lr": 0.0004969702667465396, "time_ms": 2688.3788108825684, "eta_seconds": 17232.508177757263, "eta": "4:47:12", "timestamp": 1765129756.7380493} +{"step": 3600, "loss": 3.879608392715454, "lr": 0.0004962285983379276, "time_ms": 2688.159227371216, "eta_seconds": 17204.21905517578, "eta": "4:46:44", "timestamp": 1765129783.622691} +{"step": 3610, "loss": 3.8458781242370605, "lr": 0.0004954849044863036, "time_ms": 2688.5006427764893, "eta_seconds": 17179.519107341766, "eta": "4:46:19", "timestamp": 1765129810.505242} +{"step": 3620, "loss": 3.772733688354492, "lr": 0.0004947391942533423, "time_ms": 2688.014030456543, "eta_seconds": 17149.529514312744, "eta": "4:45:49", "timestamp": 1765129837.391187} +{"step": 3630, "loss": 3.883812189102173, "lr": 0.0004939914767252873, "time_ms": 2688.0874633789062, "eta_seconds": 17123.117141723633, "eta": "4:45:23", "timestamp": 1765129864.278447} +{"step": 3640, "loss": 3.8938052654266357, "lr": 0.0004932417610128412, "time_ms": 2688.232898712158, "eta_seconds": 17097.161235809326, "eta": "4:44:57", "timestamp": 1765129891.166211} +{"step": 3650, "loss": 3.8687994480133057, "lr": 0.000492490056251053, "time_ms": 2688.1511211395264, "eta_seconds": 17069.759619235992, "eta": "4:44:29", "timestamp": 1765129918.0536494} +{"step": 3660, "loss": 3.907830238342285, "lr": 0.0004917363715992081, "time_ms": 2688.6534690856934, "eta_seconds": 17046.062994003296, "eta": "4:44:06", "timestamp": 1765129944.9425693} +{"step": 3670, "loss": 3.765756368637085, "lr": 0.0004909807162407162, "time_ms": 2688.5933876037598, "eta_seconds": 17018.7961435318, "eta": "4:43:38", "timestamp": 1765129971.8321393} +{"step": 3680, "loss": 3.8678083419799805, "lr": 0.0004902230993829994, "time_ms": 2689.563751220703, "eta_seconds": 16998.042907714844, "eta": "4:43:18", "timestamp": 1765129998.7210183} +{"step": 3690, "loss": 3.757514238357544, "lr": 0.0004894635302573798, "time_ms": 2690.014123916626, "eta_seconds": 16973.98912191391, "eta": "4:42:53", "timestamp": 1765130025.6112452} +{"step": 3700, "loss": 3.7789676189422607, "lr": 0.0004887020181189677, "time_ms": 2689.8536682128906, "eta_seconds": 16946.07810974121, "eta": "4:42:26", "timestamp": 1765130052.5030766} +{"step": 3710, "loss": 3.8415417671203613, "lr": 0.00048793857224654815, "time_ms": 2687.2308254241943, "eta_seconds": 16902.681891918182, "eta": "4:41:42", "timestamp": 1765130079.386646} +{"step": 3720, "loss": 3.922987222671509, "lr": 0.00048717320194246804, "time_ms": 2689.283609390259, "eta_seconds": 16888.701066970825, "eta": "4:41:28", "timestamp": 1765130106.2755945} +{"step": 3730, "loss": 3.81547212600708, "lr": 0.0004864059165325232, "time_ms": 2687.793016433716, "eta_seconds": 16852.4622130394, "eta": "4:40:52", "timestamp": 1765130133.1653953} +{"step": 3740, "loss": 3.841766119003296, "lr": 0.0004856367253658441, "time_ms": 2688.8935565948486, "eta_seconds": 16832.473664283752, "eta": "4:40:32", "timestamp": 1765130160.0561714} +{"step": 3750, "loss": 3.742861747741699, "lr": 0.00048486563781478234, "time_ms": 2688.0335807800293, "eta_seconds": 16800.209879875183, "eta": "4:40:00", "timestamp": 1765130186.9442732} +{"step": 3760, "loss": 3.6967756748199463, "lr": 0.00048409266327479656, "time_ms": 2688.798189163208, "eta_seconds": 16778.100700378418, "eta": "4:39:38", "timestamp": 1765130213.830113} +{"step": 3770, "loss": 3.9097487926483154, "lr": 0.0004833178111643373, "time_ms": 2684.7939491271973, "eta_seconds": 16726.26630306244, "eta": "4:38:46", "timestamp": 1765130240.691876} +{"step": 3780, "loss": 3.8741772174835205, "lr": 0.00048254109092473314, "time_ms": 2686.7287158966064, "eta_seconds": 16711.452612876892, "eta": "4:38:31", "timestamp": 1765130267.561478} +{"step": 3790, "loss": 3.5968289375305176, "lr": 0.00048176251202007516, "time_ms": 2688.1744861602783, "eta_seconds": 16693.56355905533, "eta": "4:38:13", "timestamp": 1765130294.442284} +{"step": 3800, "loss": 3.744539976119995, "lr": 0.00048098208393710154, "time_ms": 2688.5526180267334, "eta_seconds": 16669.026231765747, "eta": "4:37:49", "timestamp": 1765130321.3288825} +{"step": 3810, "loss": 3.8645899295806885, "lr": 0.00048019981618508225, "time_ms": 2688.638210296631, "eta_seconds": 16642.670521736145, "eta": "4:37:22", "timestamp": 1765130348.2159684} +{"step": 3820, "loss": 3.7573108673095703, "lr": 0.00047941571829570283, "time_ms": 2687.8883838653564, "eta_seconds": 16611.150212287903, "eta": "4:36:51", "timestamp": 1765130375.1043828} +{"step": 3830, "loss": 3.9844441413879395, "lr": 0.0004786297998229487, "time_ms": 2688.263416290283, "eta_seconds": 16586.585278511047, "eta": "4:36:26", "timestamp": 1765130401.995784} +{"step": 3840, "loss": 3.657184600830078, "lr": 0.0004778420703429885, "time_ms": 2688.392400741577, "eta_seconds": 16560.497188568115, "eta": "4:36:00", "timestamp": 1765130428.89026} +{"step": 3850, "loss": 3.8730812072753906, "lr": 0.00047705253945405727, "time_ms": 2689.157724380493, "eta_seconds": 16538.320004940033, "eta": "4:35:38", "timestamp": 1765130455.7793028} +{"step": 3860, "loss": 3.7259299755096436, "lr": 0.00047626121677633973, "time_ms": 2687.993288040161, "eta_seconds": 16504.27878856659, "eta": "4:35:04", "timestamp": 1765130482.6711287} +{"step": 3870, "loss": 3.71696138381958, "lr": 0.00047546811195185295, "time_ms": 2689.0079975128174, "eta_seconds": 16483.61902475357, "eta": "4:34:43", "timestamp": 1765130509.5642686} +{"step": 3880, "loss": 3.7578039169311523, "lr": 0.000474673234644329, "time_ms": 2687.19220161438, "eta_seconds": 16445.616273880005, "eta": "4:34:05", "timestamp": 1765130536.4559424} +{"step": 3890, "loss": 3.6949119567871094, "lr": 0.000473876594539097, "time_ms": 2688.5273456573486, "eta_seconds": 16426.9020819664, "eta": "4:33:46", "timestamp": 1765130563.3482184} +{"step": 3900, "loss": 3.7928380966186523, "lr": 0.00047307820134296524, "time_ms": 2688.438892364502, "eta_seconds": 16399.477243423462, "eta": "4:33:19", "timestamp": 1765130590.2388585} +{"step": 3910, "loss": 3.673444986343384, "lr": 0.0004722780647841029, "time_ms": 2689.2330646514893, "eta_seconds": 16377.42936372757, "eta": "4:32:57", "timestamp": 1765130617.1326568} +{"step": 3920, "loss": 3.717175006866455, "lr": 0.00047147619461192133, "time_ms": 2688.908576965332, "eta_seconds": 16348.564147949219, "eta": "4:32:28", "timestamp": 1765130644.0232968} +{"step": 3930, "loss": 3.8434865474700928, "lr": 0.0004706726005969556, "time_ms": 2689.1298294067383, "eta_seconds": 16323.018064498901, "eta": "4:32:03", "timestamp": 1765130670.9178512} +{"step": 3940, "loss": 3.8052213191986084, "lr": 0.0004698672925307451, "time_ms": 2689.1698837280273, "eta_seconds": 16296.369495391846, "eta": "4:31:36", "timestamp": 1765130697.8112268} +{"step": 3950, "loss": 3.7479493618011475, "lr": 0.0004690602802257146, "time_ms": 2688.249111175537, "eta_seconds": 16263.907122612, "eta": "4:31:03", "timestamp": 1765130724.7049644} +{"step": 3960, "loss": 3.8036913871765137, "lr": 0.0004682515735150542, "time_ms": 2688.788652420044, "eta_seconds": 16240.283460617065, "eta": "4:30:40", "timestamp": 1765130751.5984216} +{"step": 3970, "loss": 3.6737775802612305, "lr": 0.0004674411822526002, "time_ms": 2688.5671615600586, "eta_seconds": 16212.059984207153, "eta": "4:30:12", "timestamp": 1765130778.4926805} +{"step": 3980, "loss": 3.7850334644317627, "lr": 0.0004666291163127141, "time_ms": 2689.2993450164795, "eta_seconds": 16189.582056999207, "eta": "4:29:49", "timestamp": 1765130805.3844497} +{"step": 3990, "loss": 3.6875503063201904, "lr": 0.00046581538559016343, "time_ms": 2689.0602111816406, "eta_seconds": 16161.25186920166, "eta": "4:29:21", "timestamp": 1765130832.2753623} +{"step": 4000, "loss": 3.7642388343811035, "lr": 0.0004649999999999999, "time_ms": 52804.76784706116, "eta_seconds": 316828.60708236694, "eta": "3 days, 16:00:28", "timestamp": 1765130909.2864263} +{"step": 4010, "loss": 3.7570154666900635, "lr": 0.0004641829694774399, "time_ms": 2690.08469581604, "eta_seconds": 16113.60732793808, "eta": "4:28:33", "timestamp": 1765130936.1862507} +{"step": 4020, "loss": 3.753396511077881, "lr": 0.0004633643039777423, "time_ms": 2691.120147705078, "eta_seconds": 16092.898483276367, "eta": "4:28:12", "timestamp": 1765130963.0938582} +{"step": 4030, "loss": 3.710937738418579, "lr": 0.00046254401347608793, "time_ms": 2690.5758380889893, "eta_seconds": 16062.737753391266, "eta": "4:27:42", "timestamp": 1765130990.0085008} +{"step": 4040, "loss": 3.8796215057373047, "lr": 0.00046172210796745775, "time_ms": 2689.7482872009277, "eta_seconds": 16030.89979171753, "eta": "4:27:10", "timestamp": 1765131016.9218466} +{"step": 4050, "loss": 3.7172927856445312, "lr": 0.00046089859746651095, "time_ms": 2691.2314891815186, "eta_seconds": 16012.827360630035, "eta": "4:26:52", "timestamp": 1765131043.8395407} +{"step": 4060, "loss": 3.7235212326049805, "lr": 0.000460073492007463, "time_ms": 2690.394401550293, "eta_seconds": 15980.94274520874, "eta": "4:26:20", "timestamp": 1765131070.7555063} +{"step": 4070, "loss": 3.7379000186920166, "lr": 0.0004592468016439638, "time_ms": 2691.500663757324, "eta_seconds": 15960.598936080933, "eta": "4:26:00", "timestamp": 1765131097.6777644} +{"step": 4080, "loss": 3.676144599914551, "lr": 0.00045841853644897426, "time_ms": 2691.931962966919, "eta_seconds": 15936.23722076416, "eta": "4:25:36", "timestamp": 1765131124.5986722} +{"step": 4090, "loss": 3.731685161590576, "lr": 0.0004575887065146445, "time_ms": 2690.7286643981934, "eta_seconds": 15902.206406593323, "eta": "4:25:02", "timestamp": 1765131151.5156846} +{"step": 4100, "loss": 3.7531063556671143, "lr": 0.0004567573219521904, "time_ms": 2691.3938522338867, "eta_seconds": 15879.223728179932, "eta": "4:24:39", "timestamp": 1765131178.4387918} +{"step": 4110, "loss": 3.687319755554199, "lr": 0.00045592439289177057, "time_ms": 2692.075490951538, "eta_seconds": 15856.32464170456, "eta": "4:24:16", "timestamp": 1765131205.362227} +{"step": 4120, "loss": 3.6061697006225586, "lr": 0.0004550899294823626, "time_ms": 2691.354513168335, "eta_seconds": 15825.16453742981, "eta": "4:23:45", "timestamp": 1765131232.279605} +{"step": 4130, "loss": 3.7958741188049316, "lr": 0.0004542539418916399, "time_ms": 2692.117214202881, "eta_seconds": 15802.72804737091, "eta": "4:23:22", "timestamp": 1765131259.20077} +{"step": 4140, "loss": 3.8079843521118164, "lr": 0.0004534164403058474, "time_ms": 2692.65079498291, "eta_seconds": 15778.933658599854, "eta": "4:22:58", "timestamp": 1765131286.1246898} +{"step": 4150, "loss": 3.7453932762145996, "lr": 0.0004525774349296775, "time_ms": 2691.105842590332, "eta_seconds": 15742.969179153442, "eta": "4:22:22", "timestamp": 1765131313.0435195} +{"step": 4160, "loss": 3.583233118057251, "lr": 0.00045173693598614623, "time_ms": 2691.1144256591797, "eta_seconds": 15716.10824584961, "eta": "4:21:56", "timestamp": 1765131339.9580674} +{"step": 4170, "loss": 3.746497631072998, "lr": 0.0004508949537164677, "time_ms": 2691.181421279907, "eta_seconds": 15689.58768606186, "eta": "4:21:29", "timestamp": 1765131366.8762205} +{"step": 4180, "loss": 3.788916826248169, "lr": 0.00045005149837993035, "time_ms": 2691.7645931243896, "eta_seconds": 15666.069931983948, "eta": "4:21:06", "timestamp": 1765131393.7938888} +{"step": 4190, "loss": 3.6866350173950195, "lr": 0.00044920658025377115, "time_ms": 2691.6441917419434, "eta_seconds": 15638.452754020691, "eta": "4:20:38", "timestamp": 1765131420.7102985} +{"step": 4200, "loss": 3.801429271697998, "lr": 0.0004483602096330508, "time_ms": 2689.53013420105, "eta_seconds": 15599.274778366089, "eta": "4:19:59", "timestamp": 1765131447.6245162} +{"step": 4210, "loss": 3.8512394428253174, "lr": 0.0004475123968305284, "time_ms": 2690.6027793884277, "eta_seconds": 15578.590092658997, "eta": "4:19:38", "timestamp": 1765131474.5377495} +{"step": 4220, "loss": 3.8097519874572754, "lr": 0.0004466631521765352, "time_ms": 2690.2616024017334, "eta_seconds": 15549.712061882019, "eta": "4:19:09", "timestamp": 1765131501.4519029} +{"step": 4230, "loss": 3.8016459941864014, "lr": 0.0004458124860188493, "time_ms": 2691.106081008911, "eta_seconds": 15527.682087421417, "eta": "4:18:47", "timestamp": 1765131528.3677032} +{"step": 4240, "loss": 3.7269394397735596, "lr": 0.00044496040872256956, "time_ms": 2689.1136169433594, "eta_seconds": 15489.29443359375, "eta": "4:18:09", "timestamp": 1765131555.2831442} +{"step": 4250, "loss": 3.7691829204559326, "lr": 0.00044410693066998877, "time_ms": 2690.520763397217, "eta_seconds": 15470.494389533997, "eta": "4:17:50", "timestamp": 1765131582.1940727} +{"step": 4260, "loss": 3.6822264194488525, "lr": 0.00044325206226046777, "time_ms": 2690.135717391968, "eta_seconds": 15441.379017829895, "eta": "4:17:21", "timestamp": 1765131609.1076376} +{"step": 4270, "loss": 3.4620144367218018, "lr": 0.0004423958139103083, "time_ms": 2691.763401031494, "eta_seconds": 15423.804287910461, "eta": "4:17:03", "timestamp": 1765131636.024587} +{"step": 4280, "loss": 3.690488815307617, "lr": 0.00044153819605262623, "time_ms": 2690.535068511963, "eta_seconds": 15389.860591888428, "eta": "4:16:29", "timestamp": 1765131662.9388707} +{"step": 4290, "loss": 3.683811902999878, "lr": 0.00044067921913722456, "time_ms": 2691.499948501587, "eta_seconds": 15368.464705944061, "eta": "4:16:08", "timestamp": 1765131689.8555174} +{"step": 4300, "loss": 3.719294786453247, "lr": 0.00043981889363046604, "time_ms": 2691.3583278656006, "eta_seconds": 15340.742468833923, "eta": "4:15:40", "timestamp": 1765131716.772446} +{"step": 4310, "loss": 3.7546439170837402, "lr": 0.0004389572300151453, "time_ms": 2691.0135746002197, "eta_seconds": 15311.86723947525, "eta": "4:15:11", "timestamp": 1765131743.6859345} +{"step": 4320, "loss": 3.558096170425415, "lr": 0.00043809423879036165, "time_ms": 2692.0294761657715, "eta_seconds": 15290.727424621582, "eta": "4:14:50", "timestamp": 1765131770.6023629} +{"step": 4330, "loss": 3.6813108921051025, "lr": 0.00043722993047139066, "time_ms": 2690.706253051758, "eta_seconds": 15256.304454803467, "eta": "4:14:16", "timestamp": 1765131797.5129814} +{"step": 4340, "loss": 3.644679069519043, "lr": 0.0004363643155895567, "time_ms": 2689.854621887207, "eta_seconds": 15224.577159881592, "eta": "4:13:44", "timestamp": 1765131824.4241953} +{"step": 4350, "loss": 3.7940869331359863, "lr": 0.0004354974046921038, "time_ms": 2690.021276473999, "eta_seconds": 15198.620212078094, "eta": "4:13:18", "timestamp": 1765131851.3354547} +{"step": 4360, "loss": 3.725163459777832, "lr": 0.00043462920834206773, "time_ms": 2690.3862953186035, "eta_seconds": 15173.778705596924, "eta": "4:12:53", "timestamp": 1765131878.2414985} +{"step": 4370, "loss": 3.6847236156463623, "lr": 0.0004337597371181469, "time_ms": 2691.174030303955, "eta_seconds": 15151.309790611267, "eta": "4:12:31", "timestamp": 1765131905.144456} +{"step": 4380, "loss": 3.6675708293914795, "lr": 0.000432889001614574, "time_ms": 2688.9967918395996, "eta_seconds": 15112.16197013855, "eta": "4:11:52", "timestamp": 1765131932.0479836} +{"step": 4390, "loss": 3.5900614261627197, "lr": 0.0004320170124409861, "time_ms": 2689.131498336792, "eta_seconds": 15086.027705669403, "eta": "4:11:26", "timestamp": 1765131958.951026} +{"step": 4400, "loss": 3.723742961883545, "lr": 0.0004311437802222962, "time_ms": 2689.253807067871, "eta_seconds": 15059.821319580078, "eta": "4:10:59", "timestamp": 1765131985.8546593} +{"step": 4410, "loss": 3.684633731842041, "lr": 0.0004302693155985634, "time_ms": 2689.497709274292, "eta_seconds": 15034.292194843292, "eta": "4:10:34", "timestamp": 1765132012.7568798} +{"step": 4420, "loss": 3.8144142627716064, "lr": 0.00042939362922486305, "time_ms": 2690.350294113159, "eta_seconds": 15012.154641151428, "eta": "4:10:12", "timestamp": 1765132039.6624038} +{"step": 4430, "loss": 3.794452667236328, "lr": 0.00042851673177115717, "time_ms": 2690.729856491089, "eta_seconds": 14987.365300655365, "eta": "4:09:47", "timestamp": 1765132066.566616} +{"step": 4440, "loss": 3.6910510063171387, "lr": 0.0004276386339221648, "time_ms": 2691.023349761963, "eta_seconds": 14962.089824676514, "eta": "4:09:22", "timestamp": 1765132093.4712443} +{"step": 4450, "loss": 3.797473192214966, "lr": 0.00042675934637723096, "time_ms": 2689.7261142730713, "eta_seconds": 14927.979934215546, "eta": "4:08:47", "timestamp": 1765132120.3790872} +{"step": 4460, "loss": 3.614053249359131, "lr": 0.00042587887985019696, "time_ms": 2689.7714138031006, "eta_seconds": 14901.333632469177, "eta": "4:08:21", "timestamp": 1765132147.2910938} +{"step": 4470, "loss": 3.5825908184051514, "lr": 0.0004249972450692694, "time_ms": 2690.541982650757, "eta_seconds": 14878.697164058685, "eta": "4:07:58", "timestamp": 1765132174.2019687} +{"step": 4480, "loss": 3.76223087310791, "lr": 0.00042411445277689005, "time_ms": 2691.0266876220703, "eta_seconds": 14854.467315673828, "eta": "4:07:34", "timestamp": 1765132201.1143475} +{"step": 4490, "loss": 3.5288422107696533, "lr": 0.0004232305137296043, "time_ms": 2690.613269805908, "eta_seconds": 14825.279116630554, "eta": "4:07:05", "timestamp": 1765132228.0266478} +{"step": 4500, "loss": 3.7394018173217773, "lr": 0.00042234543869793054, "time_ms": 52835.423946380615, "eta_seconds": 290594.8317050934, "eta": "3 days, 8:43:14", "timestamp": 1765132305.0826526} +{"step": 4510, "loss": 3.6888904571533203, "lr": 0.00042145923846622865, "time_ms": 2689.213275909424, "eta_seconds": 14763.780884742737, "eta": "4:06:03", "timestamp": 1765132331.958578} +{"step": 4520, "loss": 3.742673397064209, "lr": 0.00042057192383256883, "time_ms": 2688.981771469116, "eta_seconds": 14735.620107650757, "eta": "4:05:35", "timestamp": 1765132358.8445804} +{"step": 4530, "loss": 3.5666768550872803, "lr": 0.0004196835056085998, "time_ms": 2689.249277114868, "eta_seconds": 14710.193545818329, "eta": "4:05:10", "timestamp": 1765132385.7341413} +{"step": 4540, "loss": 3.7068724632263184, "lr": 0.0004187939946194174, "time_ms": 2688.314914703369, "eta_seconds": 14678.199434280396, "eta": "4:04:38", "timestamp": 1765132412.6245885} +{"step": 4550, "loss": 3.741919994354248, "lr": 0.00041790340170343225, "time_ms": 2688.5008811950684, "eta_seconds": 14652.329802513123, "eta": "4:04:12", "timestamp": 1765132439.5178437} +{"step": 4560, "loss": 3.6236822605133057, "lr": 0.00041701173771223793, "time_ms": 2688.21120262146, "eta_seconds": 14623.868942260742, "eta": "4:03:43", "timestamp": 1765132466.4107673} +{"step": 4570, "loss": 3.6976287364959717, "lr": 0.0004161190135104788, "time_ms": 2688.253164291382, "eta_seconds": 14597.214682102203, "eta": "4:03:17", "timestamp": 1765132493.3032975} +{"step": 4580, "loss": 3.5981101989746094, "lr": 0.0004152252399757176, "time_ms": 2688.7383460998535, "eta_seconds": 14572.961835861206, "eta": "4:02:52", "timestamp": 1765132520.199587} +{"step": 4590, "loss": 3.773273468017578, "lr": 0.00041433042799830273, "time_ms": 2689.277172088623, "eta_seconds": 14548.98950099945, "eta": "4:02:28", "timestamp": 1765132547.0959566} +{"step": 4600, "loss": 3.6572299003601074, "lr": 0.00041343458848123576, "time_ms": 2689.8248195648193, "eta_seconds": 14525.054025650024, "eta": "4:02:05", "timestamp": 1765132573.990555} +{"step": 4610, "loss": 3.748236656188965, "lr": 0.0004125377323400385, "time_ms": 2690.0112628936768, "eta_seconds": 14499.160706996918, "eta": "4:01:39", "timestamp": 1765132600.8855057} +{"step": 4620, "loss": 3.683753252029419, "lr": 0.00041163987050261996, "time_ms": 2690.8910274505615, "eta_seconds": 14476.993727684021, "eta": "4:01:16", "timestamp": 1765132627.782611} +{"step": 4630, "loss": 3.602186679840088, "lr": 0.0004107410139091433, "time_ms": 2689.7497177124023, "eta_seconds": 14443.9559841156, "eta": "4:00:43", "timestamp": 1765132654.6779068} +{"step": 4640, "loss": 3.5017354488372803, "lr": 0.00040984117351189255, "time_ms": 2688.918352127075, "eta_seconds": 14412.602367401123, "eta": "4:00:12", "timestamp": 1765132681.577194} +{"step": 4650, "loss": 3.5024032592773438, "lr": 0.0004089403602751389, "time_ms": 2688.3182525634766, "eta_seconds": 14382.5026512146, "eta": "3:59:42", "timestamp": 1765132708.4720712} +{"step": 4660, "loss": 3.729384422302246, "lr": 0.00040803858517500724, "time_ms": 2688.2102489471436, "eta_seconds": 14355.042729377747, "eta": "3:59:15", "timestamp": 1765132735.366165} +{"step": 4670, "loss": 3.633435010910034, "lr": 0.0004071358591993428, "time_ms": 2687.92724609375, "eta_seconds": 14326.652221679688, "eta": "3:58:46", "timestamp": 1765132762.2587774} +{"step": 4680, "loss": 3.702911853790283, "lr": 0.00040623219334757663, "time_ms": 2689.734697341919, "eta_seconds": 14309.388589859009, "eta": "3:58:29", "timestamp": 1765132789.1539128} +{"step": 4690, "loss": 3.7450530529022217, "lr": 0.00040532759863059185, "time_ms": 2688.692331314087, "eta_seconds": 14276.956279277802, "eta": "3:57:56", "timestamp": 1765132816.0452218} +{"step": 4700, "loss": 3.6070058345794678, "lr": 0.0004044220860705897, "time_ms": 2687.9639625549316, "eta_seconds": 14246.209001541138, "eta": "3:57:26", "timestamp": 1765132842.9364643} +{"step": 4710, "loss": 3.6779093742370605, "lr": 0.000403515666700955, "time_ms": 2689.465045928955, "eta_seconds": 14227.270092964172, "eta": "3:57:07", "timestamp": 1765132869.8300054} +{"step": 4720, "loss": 3.6126866340637207, "lr": 0.00040260835156612164, "time_ms": 2688.528537750244, "eta_seconds": 14195.430679321289, "eta": "3:56:35", "timestamp": 1765132896.714823} +{"step": 4730, "loss": 3.727400779724121, "lr": 0.0004017001517214383, "time_ms": 2689.570426940918, "eta_seconds": 14174.036149978638, "eta": "3:56:14", "timestamp": 1765132923.6012564} +{"step": 4740, "loss": 3.6715781688690186, "lr": 0.0004007910782330334, "time_ms": 2687.185764312744, "eta_seconds": 14134.597120285034, "eta": "3:55:34", "timestamp": 1765132950.47923} +{"step": 4750, "loss": 3.762518882751465, "lr": 0.00039988114217768053, "time_ms": 2688.2247924804688, "eta_seconds": 14113.180160522461, "eta": "3:55:13", "timestamp": 1765132977.3575473} +{"step": 4760, "loss": 3.656032085418701, "lr": 0.0003989703546426634, "time_ms": 2686.2051486968994, "eta_seconds": 14075.714979171753, "eta": "3:54:35", "timestamp": 1765133004.228529} +{"step": 4770, "loss": 3.674248695373535, "lr": 0.0003980587267256407, "time_ms": 2687.01434135437, "eta_seconds": 14053.085005283356, "eta": "3:54:13", "timestamp": 1765133031.107609} +{"step": 4780, "loss": 3.839123487472534, "lr": 0.0003971462695345108, "time_ms": 2687.1285438537598, "eta_seconds": 14026.810998916626, "eta": "3:53:46", "timestamp": 1765133057.9905605} +{"step": 4790, "loss": 3.7343015670776367, "lr": 0.00039623299418727666, "time_ms": 2687.562942504883, "eta_seconds": 14002.20293045044, "eta": "3:53:22", "timestamp": 1765133084.8717842} +{"step": 4800, "loss": 3.703749656677246, "lr": 0.0003953189118119102, "time_ms": 2686.3160133361816, "eta_seconds": 13968.843269348145, "eta": "3:52:48", "timestamp": 1765133111.7510839} +{"step": 4810, "loss": 3.6845035552978516, "lr": 0.0003944040335462168, "time_ms": 2688.3597373962402, "eta_seconds": 13952.587037086487, "eta": "3:52:32", "timestamp": 1765133138.6244907} +{"step": 4820, "loss": 3.624732732772827, "lr": 0.0003934883705376992, "time_ms": 2687.98565864563, "eta_seconds": 13923.765711784363, "eta": "3:52:03", "timestamp": 1765133165.5085223} +{"step": 4830, "loss": 3.540260076522827, "lr": 0.00039257193394342236, "time_ms": 2688.1237030029297, "eta_seconds": 13897.599544525146, "eta": "3:51:37", "timestamp": 1765133192.3979034} +{"step": 4840, "loss": 3.729161262512207, "lr": 0.000391654734929877, "time_ms": 2689.1982555389404, "eta_seconds": 13876.262998580933, "eta": "3:51:16", "timestamp": 1765133219.2929945} +{"step": 4850, "loss": 3.524585008621216, "lr": 0.0003907367846728435, "time_ms": 2688.002109527588, "eta_seconds": 13843.210864067078, "eta": "3:50:43", "timestamp": 1765133246.1885238} +{"step": 4860, "loss": 3.5102083683013916, "lr": 0.00038981809435725617, "time_ms": 2690.5956268310547, "eta_seconds": 13829.661521911621, "eta": "3:50:29", "timestamp": 1765133273.0832515} +{"step": 4870, "loss": 3.489262342453003, "lr": 0.0003888986751770665, "time_ms": 2688.401460647583, "eta_seconds": 13791.4994931221, "eta": "3:49:51", "timestamp": 1765133299.9803004} +{"step": 4880, "loss": 3.605618953704834, "lr": 0.00038797853833510705, "time_ms": 2688.619375228882, "eta_seconds": 13765.731201171875, "eta": "3:49:25", "timestamp": 1765133326.876789} +{"step": 4890, "loss": 3.6356160640716553, "lr": 0.0003870576950429549, "time_ms": 2690.476417541504, "eta_seconds": 13748.334493637085, "eta": "3:49:08", "timestamp": 1765133353.7733371} +{"step": 4900, "loss": 3.746793746948242, "lr": 0.0003861361565207949, "time_ms": 2689.4776821136475, "eta_seconds": 13716.336178779602, "eta": "3:48:36", "timestamp": 1765133380.6702557} +{"step": 4910, "loss": 3.538569211959839, "lr": 0.0003852139339972833, "time_ms": 2689.546585083008, "eta_seconds": 13689.79211807251, "eta": "3:48:09", "timestamp": 1765133407.5650713} +{"step": 4920, "loss": 3.735692024230957, "lr": 0.00038429103870941044, "time_ms": 2689.227819442749, "eta_seconds": 13661.277322769165, "eta": "3:47:41", "timestamp": 1765133434.4595904} +{"step": 4930, "loss": 3.6047887802124023, "lr": 0.000383367481902364, "time_ms": 2689.7823810577393, "eta_seconds": 13637.196671962738, "eta": "3:47:17", "timestamp": 1765133461.3596952} +{"step": 4940, "loss": 3.6860291957855225, "lr": 0.00038244327482939237, "time_ms": 2689.9020671844482, "eta_seconds": 13610.904459953308, "eta": "3:46:50", "timestamp": 1765133488.2604053} +{"step": 4950, "loss": 3.6189258098602295, "lr": 0.00038151842875166705, "time_ms": 2688.0903244018555, "eta_seconds": 13574.85613822937, "eta": "3:46:14", "timestamp": 1765133515.1632204} +{"step": 4960, "loss": 3.7083232402801514, "lr": 0.0003805929549381456, "time_ms": 2689.7940635681152, "eta_seconds": 13556.5620803833, "eta": "3:45:56", "timestamp": 1765133542.0648975} +{"step": 4970, "loss": 3.5750045776367188, "lr": 0.0003796668646654344, "time_ms": 2689.423084259033, "eta_seconds": 13527.798113822937, "eta": "3:45:27", "timestamp": 1765133568.96247} +{"step": 4980, "loss": 3.666093349456787, "lr": 0.00037874016921765114, "time_ms": 2689.0923976898193, "eta_seconds": 13499.243836402893, "eta": "3:44:59", "timestamp": 1765133595.8614056} +{"step": 4990, "loss": 3.5773444175720215, "lr": 0.00037781287988628747, "time_ms": 2689.1860961914062, "eta_seconds": 13472.822341918945, "eta": "3:44:32", "timestamp": 1765133622.7615159} +{"step": 5000, "loss": 3.7257821559906006, "lr": 0.0003768850079700712, "time_ms": 52581.78186416626, "eta_seconds": 262908.9093208313, "eta": "3 days, 1:01:48", "timestamp": 1765133699.5519943} +{"step": 5010, "loss": 3.542142152786255, "lr": 0.00037595656477482873, "time_ms": 2689.9776458740234, "eta_seconds": 13422.988452911377, "eta": "3:43:42", "timestamp": 1765133726.4440432} +{"step": 5020, "loss": 3.7951886653900146, "lr": 0.00037502756161334757, "time_ms": 2690.965175628662, "eta_seconds": 13401.006574630737, "eta": "3:43:21", "timestamp": 1765133753.3563886} +{"step": 5030, "loss": 3.6452577114105225, "lr": 0.00037409800980523796, "time_ms": 2691.1027431488037, "eta_seconds": 13374.780633449554, "eta": "3:42:54", "timestamp": 1765133780.2688036} +{"step": 5040, "loss": 3.554370403289795, "lr": 0.00037316792067679537, "time_ms": 2691.336154937744, "eta_seconds": 13349.027328491211, "eta": "3:42:29", "timestamp": 1765133807.18365} +{"step": 5050, "loss": 3.5373544692993164, "lr": 0.0003722373055608623, "time_ms": 2691.718101501465, "eta_seconds": 13324.004602432251, "eta": "3:42:04", "timestamp": 1765133834.1000252} +{"step": 5060, "loss": 3.7190749645233154, "lr": 0.00037130617579669026, "time_ms": 2691.373825073242, "eta_seconds": 13295.386695861816, "eta": "3:41:35", "timestamp": 1765133861.016614} +{"step": 5070, "loss": 3.7271039485931396, "lr": 0.00037037454272980156, "time_ms": 2690.6025409698486, "eta_seconds": 13264.670526981354, "eta": "3:41:04", "timestamp": 1765133887.931213} +{"step": 5080, "loss": 3.595651626586914, "lr": 0.0003694424177118511, "time_ms": 2691.08247756958, "eta_seconds": 13240.125789642334, "eta": "3:40:40", "timestamp": 1765133914.8438132} +{"step": 5090, "loss": 3.5822927951812744, "lr": 0.00036850981210048814, "time_ms": 2690.4544830322266, "eta_seconds": 13210.131511688232, "eta": "3:40:10", "timestamp": 1765133941.757768} +{"step": 5100, "loss": 3.6888294219970703, "lr": 0.0003675767372592176, "time_ms": 2690.885066986084, "eta_seconds": 13185.336828231812, "eta": "3:39:45", "timestamp": 1765133968.6702192} +{"step": 5110, "loss": 3.708026170730591, "lr": 0.0003666432045572621, "time_ms": 2691.297769546509, "eta_seconds": 13160.446093082428, "eta": "3:39:20", "timestamp": 1765133995.5863457} +{"step": 5120, "loss": 3.609689712524414, "lr": 0.000365709225369423, "time_ms": 2690.6983852386475, "eta_seconds": 13130.6081199646, "eta": "3:38:50", "timestamp": 1765134022.4995964} +{"step": 5130, "loss": 3.6129369735717773, "lr": 0.0003647748110759419, "time_ms": 2691.5807723999023, "eta_seconds": 13107.998361587524, "eta": "3:38:27", "timestamp": 1765134049.412281} +{"step": 5140, "loss": 3.6125664710998535, "lr": 0.0003638399730623621, "time_ms": 2690.838098526001, "eta_seconds": 13077.473158836365, "eta": "3:37:57", "timestamp": 1765134076.3256607} +{"step": 5150, "loss": 3.556455612182617, "lr": 0.00036290472271938975, "time_ms": 2690.521717071533, "eta_seconds": 13049.030327796936, "eta": "3:37:29", "timestamp": 1765134103.2395844} +{"step": 5160, "loss": 3.559642791748047, "lr": 0.00036196907144275527, "time_ms": 2691.500663757324, "eta_seconds": 13026.86321258545, "eta": "3:37:06", "timestamp": 1765134130.1513612} +{"step": 5170, "loss": 3.739997386932373, "lr": 0.00036103303063307396, "time_ms": 2691.232204437256, "eta_seconds": 12998.651547431946, "eta": "3:36:38", "timestamp": 1765134157.0646527} +{"step": 5180, "loss": 3.605043411254883, "lr": 0.0003600966116957078, "time_ms": 2691.287040710449, "eta_seconds": 12972.003536224365, "eta": "3:36:12", "timestamp": 1765134183.9792662} +{"step": 5190, "loss": 3.5504047870635986, "lr": 0.0003591598260406261, "time_ms": 2690.8276081085205, "eta_seconds": 12942.880795001984, "eta": "3:35:42", "timestamp": 1765134210.8934479} +{"step": 5200, "loss": 3.7031657695770264, "lr": 0.0003582226850822664, "time_ms": 2690.4296875, "eta_seconds": 12914.0625, "eta": "3:35:14", "timestamp": 1765134237.8051395} +{"step": 5210, "loss": 3.702183246612549, "lr": 0.0003572852002393954, "time_ms": 2690.2732849121094, "eta_seconds": 12886.409034729004, "eta": "3:34:46", "timestamp": 1765134264.7169812} +{"step": 5220, "loss": 3.6444849967956543, "lr": 0.00035634738293497027, "time_ms": 2690.819025039673, "eta_seconds": 12862.114939689636, "eta": "3:34:22", "timestamp": 1765134291.6287286} +{"step": 5230, "loss": 3.5154550075531006, "lr": 0.0003554092445959989, "time_ms": 2690.9828186035156, "eta_seconds": 12835.98804473877, "eta": "3:33:55", "timestamp": 1765134318.5392542} +{"step": 5240, "loss": 3.5562376976013184, "lr": 0.00035447079665340065, "time_ms": 2690.6721591949463, "eta_seconds": 12807.599477767944, "eta": "3:33:27", "timestamp": 1765134345.450094} +{"step": 5250, "loss": 3.5435311794281006, "lr": 0.0003535320505418677, "time_ms": 2691.4737224578857, "eta_seconds": 12784.500181674957, "eta": "3:33:04", "timestamp": 1765134372.3617225} +{"step": 5260, "loss": 3.4482171535491943, "lr": 0.0003525930176997252, "time_ms": 2690.9825801849365, "eta_seconds": 12755.2574300766, "eta": "3:32:35", "timestamp": 1765134399.2738454} +{"step": 5270, "loss": 3.573338031768799, "lr": 0.0003516537095687918, "time_ms": 2691.0290718078613, "eta_seconds": 12728.567509651184, "eta": "3:32:08", "timestamp": 1765134426.183103} +{"step": 5280, "loss": 3.453293800354004, "lr": 0.000350714137594241, "time_ms": 2691.270589828491, "eta_seconds": 12702.797183990479, "eta": "3:31:42", "timestamp": 1765134453.0956957} +{"step": 5290, "loss": 3.386354923248291, "lr": 0.0003497743132244605, "time_ms": 2691.0953521728516, "eta_seconds": 12675.05910873413, "eta": "3:31:15", "timestamp": 1765134480.0062447} +{"step": 5300, "loss": 3.625610113143921, "lr": 0.00034883424791091376, "time_ms": 2691.385507583618, "eta_seconds": 12649.511885643005, "eta": "3:30:49", "timestamp": 1765134506.9182758} +{"step": 5310, "loss": 3.6599838733673096, "lr": 0.000347893953108, "time_ms": 2691.44344329834, "eta_seconds": 12622.869749069214, "eta": "3:30:22", "timestamp": 1765134533.8315687} +{"step": 5320, "loss": 3.6538469791412354, "lr": 0.0003469534402729146, "time_ms": 2690.709352493286, "eta_seconds": 12592.51976966858, "eta": "3:29:52", "timestamp": 1765134560.7447782} +{"step": 5330, "loss": 3.521974802017212, "lr": 0.0003460127208655096, "time_ms": 2691.0040378570557, "eta_seconds": 12566.98885679245, "eta": "3:29:26", "timestamp": 1765134587.657234} +{"step": 5340, "loss": 3.5887739658355713, "lr": 0.00034507180634815417, "time_ms": 2691.312313079834, "eta_seconds": 12541.515378952026, "eta": "3:29:01", "timestamp": 1765134614.57289} +{"step": 5350, "loss": 3.584489345550537, "lr": 0.0003441307081855948, "time_ms": 2691.162586212158, "eta_seconds": 12513.906025886536, "eta": "3:28:33", "timestamp": 1765134641.4851027} +{"step": 5360, "loss": 3.561399459838867, "lr": 0.00034318943784481556, "time_ms": 2691.8368339538574, "eta_seconds": 12490.122909545898, "eta": "3:28:10", "timestamp": 1765134668.3996296} +{"step": 5370, "loss": 3.488069534301758, "lr": 0.00034224800679489843, "time_ms": 2690.742254257202, "eta_seconds": 12458.136637210846, "eta": "3:27:38", "timestamp": 1765134695.3139925} +{"step": 5380, "loss": 3.6524055004119873, "lr": 0.00034130642650688383, "time_ms": 2690.9713745117188, "eta_seconds": 12432.28775024414, "eta": "3:27:12", "timestamp": 1765134722.227537} +{"step": 5390, "loss": 3.6533589363098145, "lr": 0.00034036470845363035, "time_ms": 2690.3886795043945, "eta_seconds": 12402.691812515259, "eta": "3:26:42", "timestamp": 1765134749.1396384} +{"step": 5400, "loss": 3.6962716579437256, "lr": 0.00033942286410967523, "time_ms": 2691.002607345581, "eta_seconds": 12378.611993789673, "eta": "3:26:18", "timestamp": 1765134776.05364} +{"step": 5410, "loss": 3.6455960273742676, "lr": 0.0003384809049510946, "time_ms": 2691.554307937622, "eta_seconds": 12354.234273433685, "eta": "3:25:54", "timestamp": 1765134802.9682937} +{"step": 5420, "loss": 3.681647300720215, "lr": 0.0003375388424553636, "time_ms": 2690.5853748321533, "eta_seconds": 12322.881016731262, "eta": "3:25:22", "timestamp": 1765134829.880953} +{"step": 5430, "loss": 3.55768084526062, "lr": 0.00033659668810121635, "time_ms": 2691.570043563843, "eta_seconds": 12300.475099086761, "eta": "3:25:00", "timestamp": 1765134856.79589} +{"step": 5440, "loss": 3.6998679637908936, "lr": 0.0003356544533685063, "time_ms": 2691.070079803467, "eta_seconds": 12271.279563903809, "eta": "3:24:31", "timestamp": 1765134883.712521} +{"step": 5450, "loss": 3.6796979904174805, "lr": 0.00033471214973806654, "time_ms": 2690.3443336486816, "eta_seconds": 12241.066718101501, "eta": "3:24:01", "timestamp": 1765134910.626955} +{"step": 5460, "loss": 3.465418815612793, "lr": 0.00033376978869156923, "time_ms": 2690.81449508667, "eta_seconds": 12216.297807693481, "eta": "3:23:36", "timestamp": 1765134937.5447066} +{"step": 5470, "loss": 3.5215020179748535, "lr": 0.0003328273817113863, "time_ms": 2691.711902618408, "eta_seconds": 12193.45491886139, "eta": "3:23:13", "timestamp": 1765134964.4632533} +{"step": 5480, "loss": 3.6753509044647217, "lr": 0.00033188494028044954, "time_ms": 2691.852569580078, "eta_seconds": 12167.173614501953, "eta": "3:22:47", "timestamp": 1765134991.381116} +{"step": 5490, "loss": 3.6809167861938477, "lr": 0.00033094247588211033, "time_ms": 2690.8998489379883, "eta_seconds": 12135.958318710327, "eta": "3:22:15", "timestamp": 1765135018.2981236} +{"step": 5500, "loss": 3.5302722454071045, "lr": 0.00032999999999999994, "time_ms": 52576.611042022705, "eta_seconds": 236594.74968910217, "eta": "2 days, 17:43:14", "timestamp": 1765135095.0994575} +{"step": 5510, "loss": 3.47719407081604, "lr": 0.0003290575241178896, "time_ms": 2689.6615028381348, "eta_seconds": 12076.580147743225, "eta": "3:21:16", "timestamp": 1765135121.997743} +{"step": 5520, "loss": 3.4518444538116455, "lr": 0.00032811505971955035, "time_ms": 2690.2384757995605, "eta_seconds": 12052.268371582031, "eta": "3:20:52", "timestamp": 1765135148.9055982} +{"step": 5530, "loss": 3.5136008262634277, "lr": 0.00032717261828861364, "time_ms": 2691.2851333618164, "eta_seconds": 12030.04454612732, "eta": "3:20:30", "timestamp": 1765135175.8210351} +{"step": 5540, "loss": 3.5563414096832275, "lr": 0.00032623021130843077, "time_ms": 2691.0250186920166, "eta_seconds": 12001.971583366394, "eta": "3:20:01", "timestamp": 1765135202.7330117} +{"step": 5550, "loss": 3.6759562492370605, "lr": 0.0003252878502619334, "time_ms": 2691.375970840454, "eta_seconds": 11976.62307024002, "eta": "3:19:36", "timestamp": 1765135229.6491694} +{"step": 5560, "loss": 3.55159068107605, "lr": 0.00032434554663149357, "time_ms": 2690.844774246216, "eta_seconds": 11947.350797653198, "eta": "3:19:07", "timestamp": 1765135256.5626936} +{"step": 5570, "loss": 3.5696797370910645, "lr": 0.0003234033118987836, "time_ms": 2690.2518272399902, "eta_seconds": 11917.815594673157, "eta": "3:18:37", "timestamp": 1765135283.4719698} +{"step": 5580, "loss": 3.462432384490967, "lr": 0.0003224611575446364, "time_ms": 2690.0012493133545, "eta_seconds": 11889.805521965027, "eta": "3:18:09", "timestamp": 1765135310.3723302} +{"step": 5590, "loss": 3.528493881225586, "lr": 0.0003215190950489053, "time_ms": 2690.448760986328, "eta_seconds": 11864.879035949707, "eta": "3:17:44", "timestamp": 1765135337.2803304} +{"step": 5600, "loss": 3.5367424488067627, "lr": 0.00032057713589032477, "time_ms": 2691.7104721069336, "eta_seconds": 11843.526077270508, "eta": "3:17:23", "timestamp": 1765135364.1947973} +{"step": 5610, "loss": 3.557140350341797, "lr": 0.0003196352915463696, "time_ms": 2690.4520988464355, "eta_seconds": 11811.084713935852, "eta": "3:16:51", "timestamp": 1765135391.108985} +{"step": 5620, "loss": 3.679509401321411, "lr": 0.0003186935734931161, "time_ms": 2690.5295848846436, "eta_seconds": 11784.519581794739, "eta": "3:16:24", "timestamp": 1765135418.0220127} +{"step": 5630, "loss": 3.5390427112579346, "lr": 0.00031775199320510146, "time_ms": 2690.4664039611816, "eta_seconds": 11757.338185310364, "eta": "3:15:57", "timestamp": 1765135444.9338422} +{"step": 5640, "loss": 3.549666166305542, "lr": 0.0003168105621551844, "time_ms": 2691.5361881256104, "eta_seconds": 11735.097780227661, "eta": "3:15:35", "timestamp": 1765135471.8506742} +{"step": 5650, "loss": 3.452528715133667, "lr": 0.0003158692918144051, "time_ms": 2691.936492919922, "eta_seconds": 11709.92374420166, "eta": "3:15:09", "timestamp": 1765135498.7670135} +{"step": 5660, "loss": 3.5731427669525146, "lr": 0.0003149281936518457, "time_ms": 2691.01881980896, "eta_seconds": 11679.021677970886, "eta": "3:14:39", "timestamp": 1765135525.6815767} +{"step": 5670, "loss": 3.5008463859558105, "lr": 0.00031398727913449037, "time_ms": 2690.396308898926, "eta_seconds": 11649.416017532349, "eta": "3:14:09", "timestamp": 1765135552.5939834} +{"step": 5680, "loss": 3.604156255722046, "lr": 0.00031304655972708536, "time_ms": 2690.6421184539795, "eta_seconds": 11623.573951721191, "eta": "3:13:43", "timestamp": 1765135579.5066154} +{"step": 5690, "loss": 3.6722640991210938, "lr": 0.000312106046892, "time_ms": 2690.938949584961, "eta_seconds": 11597.946872711182, "eta": "3:13:17", "timestamp": 1765135606.415784} +{"step": 5700, "loss": 3.57108736038208, "lr": 0.0003111657520890861, "time_ms": 2690.972089767456, "eta_seconds": 11571.179986000061, "eta": "3:12:51", "timestamp": 1765135633.3254635} +{"step": 5710, "loss": 3.3976991176605225, "lr": 0.00031022568677553945, "time_ms": 2690.9594535827637, "eta_seconds": 11544.216055870056, "eta": "3:12:24", "timestamp": 1765135660.2352664} +{"step": 5720, "loss": 3.566011667251587, "lr": 0.0003092858624057589, "time_ms": 2689.6755695343018, "eta_seconds": 11511.811437606812, "eta": "3:11:51", "timestamp": 1765135687.1390398} +{"step": 5730, "loss": 3.5751349925994873, "lr": 0.0003083462904312081, "time_ms": 2690.4115676879883, "eta_seconds": 11488.05739402771, "eta": "3:11:28", "timestamp": 1765135714.047868} +{"step": 5740, "loss": 3.542179584503174, "lr": 0.0003074069823002748, "time_ms": 2690.650224685669, "eta_seconds": 11462.16995716095, "eta": "3:11:02", "timestamp": 1765135740.9563076} +{"step": 5750, "loss": 3.53115177154541, "lr": 0.0003064679494581322, "time_ms": 2691.366672515869, "eta_seconds": 11438.308358192444, "eta": "3:10:38", "timestamp": 1765135767.8695307} +{"step": 5760, "loss": 3.4548020362854004, "lr": 0.00030552920334659935, "time_ms": 2690.9806728363037, "eta_seconds": 11409.758052825928, "eta": "3:10:09", "timestamp": 1765135794.7828577} +{"step": 5770, "loss": 3.466799020767212, "lr": 0.0003045907554040011, "time_ms": 2690.652847290039, "eta_seconds": 11381.461544036865, "eta": "3:09:41", "timestamp": 1765135821.695936} +{"step": 5780, "loss": 3.623839855194092, "lr": 0.0003036526170650296, "time_ms": 2690.976619720459, "eta_seconds": 11355.921335220337, "eta": "3:09:15", "timestamp": 1765135848.6091266} +{"step": 5790, "loss": 3.4901771545410156, "lr": 0.0003027147997606044, "time_ms": 2691.4124488830566, "eta_seconds": 11330.846409797668, "eta": "3:08:50", "timestamp": 1765135875.5232847} +{"step": 5800, "loss": 3.520242214202881, "lr": 0.0003017773149177336, "time_ms": 2691.011428833008, "eta_seconds": 11302.248001098633, "eta": "3:08:22", "timestamp": 1765135902.4373362} +{"step": 5810, "loss": 3.4153010845184326, "lr": 0.0003008401739593738, "time_ms": 2690.1180744171143, "eta_seconds": 11271.594731807709, "eta": "3:07:51", "timestamp": 1765135929.348228} +{"step": 5820, "loss": 3.5906379222869873, "lr": 0.0002999033883042921, "time_ms": 2690.873861312866, "eta_seconds": 11247.85274028778, "eta": "3:07:27", "timestamp": 1765135956.2592945} +{"step": 5830, "loss": 3.5189883708953857, "lr": 0.00029896696936692604, "time_ms": 2690.685510635376, "eta_seconds": 11220.158579349518, "eta": "3:07:00", "timestamp": 1765135983.1734595} +{"step": 5840, "loss": 3.4467554092407227, "lr": 0.0002980309285572447, "time_ms": 2691.347360610962, "eta_seconds": 11196.005020141602, "eta": "3:06:36", "timestamp": 1765136010.0850573} +{"step": 5850, "loss": 3.50405216217041, "lr": 0.0002970952772806102, "time_ms": 2690.5264854431152, "eta_seconds": 11165.684914588928, "eta": "3:06:05", "timestamp": 1765136036.9971087} +{"step": 5860, "loss": 3.5450353622436523, "lr": 0.0002961600269376378, "time_ms": 2690.7989978790283, "eta_seconds": 11139.907851219177, "eta": "3:05:39", "timestamp": 1765136063.9078057} +{"step": 5870, "loss": 3.5115067958831787, "lr": 0.000295225188924058, "time_ms": 2690.887212753296, "eta_seconds": 11113.364188671112, "eta": "3:05:13", "timestamp": 1765136090.822061} +{"step": 5880, "loss": 3.4926419258117676, "lr": 0.00029429077463057686, "time_ms": 2691.183567047119, "eta_seconds": 11087.67629623413, "eta": "3:04:47", "timestamp": 1765136117.7357597} +{"step": 5890, "loss": 3.4198520183563232, "lr": 0.0002933567954427378, "time_ms": 2690.520763397217, "eta_seconds": 11058.040337562561, "eta": "3:04:18", "timestamp": 1765136144.6472695} +{"step": 5900, "loss": 3.39607834815979, "lr": 0.00029242326274078235, "time_ms": 2691.889762878418, "eta_seconds": 11036.748027801514, "eta": "3:03:56", "timestamp": 1765136171.5595486} +{"step": 5910, "loss": 3.486295461654663, "lr": 0.00029149018789951186, "time_ms": 2691.2500858306885, "eta_seconds": 11007.212851047516, "eta": "3:03:27", "timestamp": 1765136198.471256} +{"step": 5920, "loss": 3.5351791381835938, "lr": 0.00029055758228814884, "time_ms": 2690.2341842651367, "eta_seconds": 10976.155471801758, "eta": "3:02:56", "timestamp": 1765136225.380978} +{"step": 5930, "loss": 3.517378568649292, "lr": 0.00028962545727019844, "time_ms": 2690.452814102173, "eta_seconds": 10950.142953395844, "eta": "3:02:30", "timestamp": 1765136252.2944407} +{"step": 5940, "loss": 3.538886070251465, "lr": 0.00028869382420330974, "time_ms": 2691.1075115203857, "eta_seconds": 10925.896496772766, "eta": "3:02:05", "timestamp": 1765136279.207934} +{"step": 5950, "loss": 3.495985269546509, "lr": 0.0002877626944391376, "time_ms": 2690.7451152801514, "eta_seconds": 10897.517716884613, "eta": "3:01:37", "timestamp": 1765136306.119894} +{"step": 5960, "loss": 3.47821307182312, "lr": 0.0002868320793232046, "time_ms": 2690.6440258026123, "eta_seconds": 10870.201864242554, "eta": "3:01:10", "timestamp": 1765136333.03338} +{"step": 5970, "loss": 3.4509494304656982, "lr": 0.00028590199019476204, "time_ms": 2691.258430480957, "eta_seconds": 10845.771474838257, "eta": "3:00:45", "timestamp": 1765136359.9470375} +{"step": 5980, "loss": 3.3957533836364746, "lr": 0.0002849724383866524, "time_ms": 2690.866470336914, "eta_seconds": 10817.283210754395, "eta": "3:00:17", "timestamp": 1765136386.8625252} +{"step": 5990, "loss": 3.508836030960083, "lr": 0.0002840434352251712, "time_ms": 2690.6838417053223, "eta_seconds": 10789.642205238342, "eta": "2:59:49", "timestamp": 1765136413.7767856} +{"step": 6000, "loss": 3.420541286468506, "lr": 0.0002831149920299288, "time_ms": 49932.13629722595, "eta_seconds": 199728.5451889038, "eta": "2 days, 7:28:48", "timestamp": 1765136487.9343574} +{"step": 6010, "loss": 3.5173749923706055, "lr": 0.0002821871201137125, "time_ms": 2690.7994747161865, "eta_seconds": 10736.289904117584, "eta": "2:58:56", "timestamp": 1765136514.8519993} +{"step": 6020, "loss": 3.449103832244873, "lr": 0.0002812598307823488, "time_ms": 2691.9167041778564, "eta_seconds": 10713.828482627869, "eta": "2:58:33", "timestamp": 1765136541.768577} +{"step": 6030, "loss": 3.450855255126953, "lr": 0.0002803331353345655, "time_ms": 2691.0555362701416, "eta_seconds": 10683.490478992462, "eta": "2:58:03", "timestamp": 1765136568.686697} +{"step": 6040, "loss": 3.6312997341156006, "lr": 0.0002794070450618543, "time_ms": 2690.6723976135254, "eta_seconds": 10655.06269454956, "eta": "2:57:35", "timestamp": 1765136595.6024075} +{"step": 6050, "loss": 3.5521318912506104, "lr": 0.00027848157124833284, "time_ms": 2691.484212875366, "eta_seconds": 10631.362640857697, "eta": "2:57:11", "timestamp": 1765136622.5150135} +{"step": 6060, "loss": 3.3981292247772217, "lr": 0.0002775567251706076, "time_ms": 2690.9704208374023, "eta_seconds": 10602.423458099365, "eta": "2:56:42", "timestamp": 1765136649.426829} +{"step": 6070, "loss": 3.4012625217437744, "lr": 0.0002766325180976359, "time_ms": 2690.406084060669, "eta_seconds": 10573.295910358429, "eta": "2:56:13", "timestamp": 1765136676.457454} +{"step": 6080, "loss": 3.4841156005859375, "lr": 0.00027570896129058955, "time_ms": 2690.422296524048, "eta_seconds": 10546.455402374268, "eta": "2:55:46", "timestamp": 1765136703.3687441} +{"step": 6090, "loss": 3.562171697616577, "lr": 0.0002747860660027166, "time_ms": 2690.1891231536865, "eta_seconds": 10518.639471530914, "eta": "2:55:18", "timestamp": 1765136730.2756002} +{"step": 6100, "loss": 3.4397482872009277, "lr": 0.000273863843479205, "time_ms": 2691.225051879883, "eta_seconds": 10495.777702331543, "eta": "2:54:55", "timestamp": 1765136757.1817033} +{"step": 6110, "loss": 3.3686983585357666, "lr": 0.00027294230495704505, "time_ms": 2691.2291049957275, "eta_seconds": 10468.88121843338, "eta": "2:54:28", "timestamp": 1765136784.08812} +{"step": 6120, "loss": 3.5265955924987793, "lr": 0.0002720214616648929, "time_ms": 2690.2337074279785, "eta_seconds": 10438.106784820557, "eta": "2:53:58", "timestamp": 1765136810.9956677} +{"step": 6130, "loss": 3.418337106704712, "lr": 0.00027110132482293357, "time_ms": 2690.641164779663, "eta_seconds": 10412.781307697296, "eta": "2:53:32", "timestamp": 1765136837.9036672} +{"step": 6140, "loss": 3.587554454803467, "lr": 0.00027018190564274383, "time_ms": 2689.9335384368896, "eta_seconds": 10383.143458366394, "eta": "2:53:03", "timestamp": 1765136864.8120534} +{"step": 6150, "loss": 3.52272367477417, "lr": 0.00026926321532715644, "time_ms": 2690.4046535491943, "eta_seconds": 10358.057916164398, "eta": "2:52:38", "timestamp": 1765136891.7211206} +{"step": 6160, "loss": 3.4360411167144775, "lr": 0.0002683452650701229, "time_ms": 2690.574884414673, "eta_seconds": 10331.807556152344, "eta": "2:52:11", "timestamp": 1765136918.6282754} +{"step": 6170, "loss": 3.596872329711914, "lr": 0.00026742806605657753, "time_ms": 2690.356492996216, "eta_seconds": 10304.065368175507, "eta": "2:51:44", "timestamp": 1765136945.7092066} +{"step": 6180, "loss": 3.4629976749420166, "lr": 0.0002665116294623007, "time_ms": 2690.537691116333, "eta_seconds": 10277.853980064392, "eta": "2:51:17", "timestamp": 1765136972.9452841} +{"step": 6190, "loss": 3.4176108837127686, "lr": 0.0002655959664537832, "time_ms": 2691.2598609924316, "eta_seconds": 10253.700070381165, "eta": "2:50:53", "timestamp": 1765136999.8562398} +{"step": 6200, "loss": 3.418454885482788, "lr": 0.0002646810881880897, "time_ms": 2690.2472972869873, "eta_seconds": 10222.939729690552, "eta": "2:50:22", "timestamp": 1765137026.9345005} +{"step": 6210, "loss": 3.422356367111206, "lr": 0.0002637670058127233, "time_ms": 2690.185070037842, "eta_seconds": 10195.80141544342, "eta": "2:49:55", "timestamp": 1765137054.0333781} +{"step": 6220, "loss": 3.482009172439575, "lr": 0.0002628537304654892, "time_ms": 2690.160036087036, "eta_seconds": 10168.804936408997, "eta": "2:49:28", "timestamp": 1765137081.1671216} +{"step": 6230, "loss": 3.3580284118652344, "lr": 0.00026194127327435927, "time_ms": 2690.991163253784, "eta_seconds": 10145.036685466766, "eta": "2:49:05", "timestamp": 1765137108.0795379} +{"step": 6240, "loss": 3.493834972381592, "lr": 0.00026102964535733655, "time_ms": 2691.3583278656006, "eta_seconds": 10119.507312774658, "eta": "2:48:39", "timestamp": 1765137134.9926016} +{"step": 6250, "loss": 3.403848886489868, "lr": 0.00026011885782231935, "time_ms": 2690.4566287994385, "eta_seconds": 10089.212357997894, "eta": "2:48:09", "timestamp": 1765137161.9050312} +{"step": 6260, "loss": 3.581848621368408, "lr": 0.00025920892176696655, "time_ms": 2691.0581588745117, "eta_seconds": 10064.557514190674, "eta": "2:47:44", "timestamp": 1765137188.820753} +{"step": 6270, "loss": 3.3920047283172607, "lr": 0.00025829984827856157, "time_ms": 2690.9828186035156, "eta_seconds": 10037.365913391113, "eta": "2:47:17", "timestamp": 1765137215.7328825} +{"step": 6280, "loss": 3.361009120941162, "lr": 0.00025739164843387825, "time_ms": 2690.1159286499023, "eta_seconds": 10007.231254577637, "eta": "2:46:47", "timestamp": 1765137242.6456976} +{"step": 6290, "loss": 3.570831298828125, "lr": 0.0002564843332990449, "time_ms": 2691.154718399048, "eta_seconds": 9984.184005260468, "eta": "2:46:24", "timestamp": 1765137269.5559573} +{"step": 6300, "loss": 3.3538503646850586, "lr": 0.00025557791392941023, "time_ms": 2690.3018951416016, "eta_seconds": 9954.117012023926, "eta": "2:45:54", "timestamp": 1765137296.4656863} +{"step": 6310, "loss": 3.3225929737091064, "lr": 0.0002546724013694081, "time_ms": 2690.835952758789, "eta_seconds": 9929.184665679932, "eta": "2:45:29", "timestamp": 1765137323.37827} +{"step": 6320, "loss": 3.4126877784729004, "lr": 0.0002537678066524233, "time_ms": 2691.6141510009766, "eta_seconds": 9905.140075683594, "eta": "2:45:05", "timestamp": 1765137350.2913} +{"step": 6330, "loss": 3.43868350982666, "lr": 0.00025286414080065715, "time_ms": 2690.4664039611816, "eta_seconds": 9874.011702537537, "eta": "2:44:34", "timestamp": 1765137377.2030513} +{"step": 6340, "loss": 3.546349287033081, "lr": 0.0002519614148249926, "time_ms": 2690.73486328125, "eta_seconds": 9848.089599609375, "eta": "2:44:08", "timestamp": 1765137404.1149092} +{"step": 6350, "loss": 3.3371284008026123, "lr": 0.00025105963972486107, "time_ms": 2690.469264984131, "eta_seconds": 9820.212817192078, "eta": "2:43:40", "timestamp": 1765137431.023756} +{"step": 6360, "loss": 3.4704344272613525, "lr": 0.00025015882648810744, "time_ms": 2690.5317306518555, "eta_seconds": 9793.535499572754, "eta": "2:43:13", "timestamp": 1765137457.9332569} +{"step": 6370, "loss": 3.412588357925415, "lr": 0.00024925898609085657, "time_ms": 2690.7315254211426, "eta_seconds": 9767.355437278748, "eta": "2:42:47", "timestamp": 1765137484.8431323} +{"step": 6380, "loss": 3.4235095977783203, "lr": 0.00024836012949738, "time_ms": 2691.0908222198486, "eta_seconds": 9741.748776435852, "eta": "2:42:21", "timestamp": 1765137511.753994} +{"step": 6390, "loss": 3.4516563415527344, "lr": 0.00024746226765996147, "time_ms": 2690.2689933776855, "eta_seconds": 9711.871066093445, "eta": "2:41:51", "timestamp": 1765137538.663548} +{"step": 6400, "loss": 3.6397013664245605, "lr": 0.0002465654115187642, "time_ms": 2691.5698051452637, "eta_seconds": 9689.65129852295, "eta": "2:41:29", "timestamp": 1765137565.5754323} +{"step": 6410, "loss": 3.5247018337249756, "lr": 0.00024566957200169716, "time_ms": 2690.1957988739014, "eta_seconds": 9657.802917957306, "eta": "2:40:57", "timestamp": 1765137592.486338} +{"step": 6420, "loss": 3.442823886871338, "lr": 0.00024477476002428234, "time_ms": 2690.631151199341, "eta_seconds": 9632.45952129364, "eta": "2:40:32", "timestamp": 1765137619.399767} +{"step": 6430, "loss": 3.549304485321045, "lr": 0.00024388098648952104, "time_ms": 2691.136360168457, "eta_seconds": 9607.356805801392, "eta": "2:40:07", "timestamp": 1765137646.3128839} +{"step": 6440, "loss": 3.496286392211914, "lr": 0.000242988262287762, "time_ms": 2690.791606903076, "eta_seconds": 9579.218120574951, "eta": "2:39:39", "timestamp": 1765137673.225103} +{"step": 6450, "loss": 3.4224905967712402, "lr": 0.00024209659829656772, "time_ms": 2690.9985542297363, "eta_seconds": 9553.044867515564, "eta": "2:39:13", "timestamp": 1765137700.139099} +{"step": 6460, "loss": 3.4913291931152344, "lr": 0.00024120600538058248, "time_ms": 2691.7998790740967, "eta_seconds": 9528.971571922302, "eta": "2:38:48", "timestamp": 1765137727.3012466} +{"step": 6470, "loss": 3.53629207611084, "lr": 0.00024031649439140015, "time_ms": 2691.9453144073486, "eta_seconds": 9502.56695985794, "eta": "2:38:22", "timestamp": 1765137754.8785405} +{"step": 6480, "loss": 3.414605140686035, "lr": 0.00023942807616743114, "time_ms": 2688.736915588379, "eta_seconds": 9464.353942871094, "eta": "2:37:44", "timestamp": 1765137781.9615412} +{"step": 6490, "loss": 3.224918842315674, "lr": 0.0002385407615337713, "time_ms": 2689.650535583496, "eta_seconds": 9440.673379898071, "eta": "2:37:20", "timestamp": 1765137809.1476462} +{"step": 6500, "loss": 3.5934042930603027, "lr": 0.00023765456130206942, "time_ms": 50520.64752578735, "eta_seconds": 176822.26634025574, "eta": "2 days, 1:07:02", "timestamp": 1765137884.3252578} +{"step": 6510, "loss": 3.4796619415283203, "lr": 0.0002367694862703956, "time_ms": 2691.5335655212402, "eta_seconds": 9393.452143669128, "eta": "2:36:33", "timestamp": 1765137911.2393227} +{"step": 6520, "loss": 3.4967548847198486, "lr": 0.00023588554722310992, "time_ms": 2691.171407699585, "eta_seconds": 9365.276498794556, "eta": "2:36:05", "timestamp": 1765137938.1511428} +{"step": 6530, "loss": 3.4703867435455322, "lr": 0.00023500275493073048, "time_ms": 2690.8864974975586, "eta_seconds": 9337.376146316528, "eta": "2:35:37", "timestamp": 1765137965.0618584} +{"step": 6540, "loss": 3.431929588317871, "lr": 0.000234121120149803, "time_ms": 2691.1063194274902, "eta_seconds": 9311.227865219116, "eta": "2:35:11", "timestamp": 1765137991.9766192} +{"step": 6550, "loss": 3.5372202396392822, "lr": 0.0002332406536227689, "time_ms": 2690.883159637451, "eta_seconds": 9283.546900749207, "eta": "2:34:43", "timestamp": 1765138018.8878684} +{"step": 6560, "loss": 3.578564405441284, "lr": 0.00023236136607783509, "time_ms": 2690.8552646636963, "eta_seconds": 9256.542110443115, "eta": "2:34:16", "timestamp": 1765138045.7962327} +{"step": 6570, "loss": 3.37480092048645, "lr": 0.00023148326822884264, "time_ms": 2690.608024597168, "eta_seconds": 9228.785524368286, "eta": "2:33:48", "timestamp": 1765138072.705673} +{"step": 6580, "loss": 3.4870028495788574, "lr": 0.00023060637077513692, "time_ms": 2690.0150775909424, "eta_seconds": 9199.851565361023, "eta": "2:33:19", "timestamp": 1765138099.6185937} +{"step": 6590, "loss": 3.4104645252227783, "lr": 0.00022973068440143663, "time_ms": 2690.4587745666504, "eta_seconds": 9174.464421272278, "eta": "2:32:54", "timestamp": 1765138126.5306067} +{"step": 6600, "loss": 3.4747934341430664, "lr": 0.0002288562197777037, "time_ms": 2690.45090675354, "eta_seconds": 9147.533082962036, "eta": "2:32:27", "timestamp": 1765138153.440386} +{"step": 6610, "loss": 3.358769655227661, "lr": 0.00022798298755901387, "time_ms": 2690.47212600708, "eta_seconds": 9120.700507164001, "eta": "2:32:00", "timestamp": 1765138180.3481312} +{"step": 6620, "loss": 3.4173970222473145, "lr": 0.00022711099838542597, "time_ms": 2690.3164386749268, "eta_seconds": 9093.269562721252, "eta": "2:31:33", "timestamp": 1765138207.2555819} +{"step": 6630, "loss": 3.418813943862915, "lr": 0.00022624026288185298, "time_ms": 2691.021203994751, "eta_seconds": 9068.74145746231, "eta": "2:31:08", "timestamp": 1765138234.167421} +{"step": 6640, "loss": 3.5241851806640625, "lr": 0.00022537079165793218, "time_ms": 2690.8278465270996, "eta_seconds": 9041.181564331055, "eta": "2:30:41", "timestamp": 1765138261.0751827} +{"step": 6650, "loss": 3.396704912185669, "lr": 0.0002245025953078961, "time_ms": 2690.7339096069336, "eta_seconds": 9013.958597183228, "eta": "2:30:13", "timestamp": 1765138287.9824767} +{"step": 6660, "loss": 3.400761127471924, "lr": 0.00022363568441044316, "time_ms": 2690.4428005218506, "eta_seconds": 8986.078953742981, "eta": "2:29:46", "timestamp": 1765138314.8933117} +{"step": 6670, "loss": 3.3927133083343506, "lr": 0.00022277006952860923, "time_ms": 2690.653085708618, "eta_seconds": 8959.874775409698, "eta": "2:29:19", "timestamp": 1765138341.804742} +{"step": 6680, "loss": 3.4570531845092773, "lr": 0.00022190576120963837, "time_ms": 2690.1838779449463, "eta_seconds": 8931.410474777222, "eta": "2:28:51", "timestamp": 1765138368.716449} +{"step": 6690, "loss": 3.331723690032959, "lr": 0.00022104276998485465, "time_ms": 2690.9339427948, "eta_seconds": 8906.991350650787, "eta": "2:28:26", "timestamp": 1765138395.6301634} +{"step": 6700, "loss": 3.4251439571380615, "lr": 0.00022018110636953396, "time_ms": 2690.526247024536, "eta_seconds": 8878.73661518097, "eta": "2:27:58", "timestamp": 1765138422.544396} +{"step": 6710, "loss": 3.37251615524292, "lr": 0.0002193207808627753, "time_ms": 2690.7920837402344, "eta_seconds": 8852.705955505371, "eta": "2:27:32", "timestamp": 1765138449.4587204} +{"step": 6720, "loss": 3.432312250137329, "lr": 0.00021846180394737371, "time_ms": 2690.998315811157, "eta_seconds": 8826.474475860596, "eta": "2:27:06", "timestamp": 1765138476.3716955} +{"step": 6730, "loss": 3.4787094593048096, "lr": 0.00021760418608969168, "time_ms": 2689.2764568328857, "eta_seconds": 8793.934013843536, "eta": "2:26:33", "timestamp": 1765138503.2757113} +{"step": 6740, "loss": 3.5033011436462402, "lr": 0.00021674793773953215, "time_ms": 2690.3882026672363, "eta_seconds": 8770.66554069519, "eta": "2:26:10", "timestamp": 1765138530.1803086} +{"step": 6750, "loss": 3.482980966567993, "lr": 0.00021589306933001115, "time_ms": 2691.4172172546387, "eta_seconds": 8747.105956077576, "eta": "2:25:47", "timestamp": 1765138557.0927937} +{"step": 6760, "loss": 3.512728691101074, "lr": 0.00021503959127743035, "time_ms": 2691.1158561706543, "eta_seconds": 8719.21537399292, "eta": "2:25:19", "timestamp": 1765138584.0053189} +{"step": 6770, "loss": 3.3874425888061523, "lr": 0.00021418751398115062, "time_ms": 2690.653085708618, "eta_seconds": 8690.809466838837, "eta": "2:24:50", "timestamp": 1765138610.918395} +{"step": 6780, "loss": 3.3097598552703857, "lr": 0.0002133368478234647, "time_ms": 2691.4594173431396, "eta_seconds": 8666.49932384491, "eta": "2:24:26", "timestamp": 1765138637.8316422} +{"step": 6790, "loss": 3.2920711040496826, "lr": 0.00021248760316947156, "time_ms": 2691.2152767181396, "eta_seconds": 8638.801038265228, "eta": "2:23:58", "timestamp": 1765138664.7445552} +{"step": 6800, "loss": 3.2818877696990967, "lr": 0.00021163979036694904, "time_ms": 2690.382242202759, "eta_seconds": 8609.223175048828, "eta": "2:23:29", "timestamp": 1765138691.6563742} +{"step": 6810, "loss": 3.3885483741760254, "lr": 0.00021079341974622877, "time_ms": 2690.7308101654053, "eta_seconds": 8583.431284427643, "eta": "2:23:03", "timestamp": 1765138718.5673316} +{"step": 6820, "loss": 3.300163984298706, "lr": 0.00020994850162006962, "time_ms": 2690.467357635498, "eta_seconds": 8555.686197280884, "eta": "2:22:35", "timestamp": 1765138745.4761074} +{"step": 6830, "loss": 3.4955670833587646, "lr": 0.00020910504628353217, "time_ms": 2690.2706623077393, "eta_seconds": 8528.157999515533, "eta": "2:22:08", "timestamp": 1765138772.386369} +{"step": 6840, "loss": 3.530777931213379, "lr": 0.00020826306401385371, "time_ms": 2691.678762435913, "eta_seconds": 8505.704889297485, "eta": "2:21:45", "timestamp": 1765138799.2986186} +{"step": 6850, "loss": 3.528226613998413, "lr": 0.00020742256507032234, "time_ms": 2691.2434101104736, "eta_seconds": 8477.416741847992, "eta": "2:21:17", "timestamp": 1765138826.2078502} +{"step": 6860, "loss": 3.5991218090057373, "lr": 0.0002065835596941526, "time_ms": 2690.7272338867188, "eta_seconds": 8448.883514404297, "eta": "2:20:48", "timestamp": 1765138853.1209967} +{"step": 6870, "loss": 3.4468417167663574, "lr": 0.00020574605810836003, "time_ms": 2691.3506984710693, "eta_seconds": 8423.927686214447, "eta": "2:20:23", "timestamp": 1765138880.0342999} +{"step": 6880, "loss": 3.417487144470215, "lr": 0.00020491007051763737, "time_ms": 2690.481424331665, "eta_seconds": 8394.302043914795, "eta": "2:19:54", "timestamp": 1765138906.946102} +{"step": 6890, "loss": 3.351123809814453, "lr": 0.00020407560710822937, "time_ms": 2690.4654502868652, "eta_seconds": 8367.34755039215, "eta": "2:19:27", "timestamp": 1765138933.859647} +{"step": 6900, "loss": 3.500756025314331, "lr": 0.0002032426780478095, "time_ms": 2691.810369491577, "eta_seconds": 8344.61214542389, "eta": "2:19:04", "timestamp": 1765138960.7724724} +{"step": 6910, "loss": 3.400543451309204, "lr": 0.00020241129348535543, "time_ms": 2691.0245418548584, "eta_seconds": 8315.265834331512, "eta": "2:18:35", "timestamp": 1765138987.6829927} +{"step": 6920, "loss": 3.509866237640381, "lr": 0.00020158146355102563, "time_ms": 2691.68758392334, "eta_seconds": 8290.397758483887, "eta": "2:18:10", "timestamp": 1765139014.5929778} +{"step": 6930, "loss": 3.461097478866577, "lr": 0.00020075319835603615, "time_ms": 2692.187786102295, "eta_seconds": 8265.016503334045, "eta": "2:17:45", "timestamp": 1765139041.504754} +{"step": 6940, "loss": 3.554655075073242, "lr": 0.0001999265079925368, "time_ms": 2690.359592437744, "eta_seconds": 8232.500352859497, "eta": "2:17:12", "timestamp": 1765139068.4150267} +{"step": 6950, "loss": 3.4832096099853516, "lr": 0.00019910140253348897, "time_ms": 2691.049814224243, "eta_seconds": 8207.701933383942, "eta": "2:16:47", "timestamp": 1765139095.3257563} +{"step": 6960, "loss": 3.327665090560913, "lr": 0.00019827789203254208, "time_ms": 2690.674066543579, "eta_seconds": 8179.6491622924805, "eta": "2:16:19", "timestamp": 1765139122.2342753} +{"step": 6970, "loss": 3.427402973175049, "lr": 0.00019745598652391196, "time_ms": 2690.64998626709, "eta_seconds": 8152.669458389282, "eta": "2:15:52", "timestamp": 1765139149.1467342} +{"step": 6980, "loss": 3.51924467086792, "lr": 0.00019663569602225767, "time_ms": 2690.398931503296, "eta_seconds": 8125.004773139954, "eta": "2:15:25", "timestamp": 1765139176.0588627} +{"step": 6990, "loss": 3.3873050212860107, "lr": 0.00019581703052256002, "time_ms": 2691.2336349487305, "eta_seconds": 8100.613241195679, "eta": "2:15:00", "timestamp": 1765139202.973045} +{"step": 7000, "loss": 3.3779006004333496, "lr": 0.00019500000000000002, "time_ms": 52693.54796409607, "eta_seconds": 158080.6438922882, "eta": "1 day, 19:54:40", "timestamp": 1765139279.8888164} +{"step": 7010, "loss": 3.4047203063964844, "lr": 0.0001941846144098365, "time_ms": 2689.473867416382, "eta_seconds": 8041.526863574982, "eta": "2:14:01", "timestamp": 1765139306.7843802} +{"step": 7020, "loss": 3.431291103363037, "lr": 0.00019337088368728578, "time_ms": 2690.838575363159, "eta_seconds": 8018.698954582214, "eta": "2:13:38", "timestamp": 1765139333.691375} +{"step": 7030, "loss": 3.3528175354003906, "lr": 0.00019255881774739972, "time_ms": 2691.3273334503174, "eta_seconds": 7993.242180347443, "eta": "2:13:13", "timestamp": 1765139360.6043997} +{"step": 7040, "loss": 3.3947906494140625, "lr": 0.0001917484264849457, "time_ms": 2690.993070602417, "eta_seconds": 7965.339488983154, "eta": "2:12:45", "timestamp": 1765139387.5174377} +{"step": 7050, "loss": 3.348944664001465, "lr": 0.0001909397197742853, "time_ms": 2689.373254776001, "eta_seconds": 7933.651101589203, "eta": "2:12:13", "timestamp": 1765139414.4295855} +{"step": 7060, "loss": 3.446909189224243, "lr": 0.00019013270746925487, "time_ms": 2689.7435188293457, "eta_seconds": 7907.845945358276, "eta": "2:11:47", "timestamp": 1765139441.3404639} +{"step": 7070, "loss": 3.5647950172424316, "lr": 0.00018932739940304445, "time_ms": 2690.2451515197754, "eta_seconds": 7882.418293952942, "eta": "2:11:22", "timestamp": 1765139468.2523808} +{"step": 7080, "loss": 3.410280704498291, "lr": 0.00018852380538807864, "time_ms": 2690.3297901153564, "eta_seconds": 7855.762987136841, "eta": "2:10:55", "timestamp": 1765139495.1633945} +{"step": 7090, "loss": 3.4991438388824463, "lr": 0.000187721935215897, "time_ms": 2691.9405460357666, "eta_seconds": 7833.546988964081, "eta": "2:10:33", "timestamp": 1765139522.0790448} +{"step": 7100, "loss": 3.414989471435547, "lr": 0.00018692179865703468, "time_ms": 2691.0266876220703, "eta_seconds": 7803.977394104004, "eta": "2:10:03", "timestamp": 1765139548.994254} +{"step": 7110, "loss": 3.414426803588867, "lr": 0.00018612340546090284, "time_ms": 2690.990924835205, "eta_seconds": 7776.963772773743, "eta": "2:09:36", "timestamp": 1765139575.9101315} +{"step": 7120, "loss": 3.385707378387451, "lr": 0.0001853267653556708, "time_ms": 2691.0157203674316, "eta_seconds": 7750.125274658203, "eta": "2:09:10", "timestamp": 1765139602.8216069} +{"step": 7130, "loss": 3.4088165760040283, "lr": 0.0001845318880481469, "time_ms": 2691.04266166687, "eta_seconds": 7723.292438983917, "eta": "2:08:43", "timestamp": 1765139629.7337077} +{"step": 7140, "loss": 3.349766492843628, "lr": 0.00018373878322366024, "time_ms": 2690.937280654907, "eta_seconds": 7696.080622673035, "eta": "2:08:16", "timestamp": 1765139656.648402} +{"step": 7150, "loss": 3.4881389141082764, "lr": 0.00018294746054594267, "time_ms": 2691.4827823638916, "eta_seconds": 7670.725929737091, "eta": "2:07:50", "timestamp": 1765139683.5654588} +{"step": 7160, "loss": 3.3947136402130127, "lr": 0.00018215792965701143, "time_ms": 2691.3199424743652, "eta_seconds": 7643.348636627197, "eta": "2:07:23", "timestamp": 1765139710.4785044} +{"step": 7170, "loss": 3.5066614151000977, "lr": 0.00018137020017705116, "time_ms": 2690.8187866210938, "eta_seconds": 7615.017166137695, "eta": "2:06:55", "timestamp": 1765139737.3927987} +{"step": 7180, "loss": 3.4828622341156006, "lr": 0.0001805842817042971, "time_ms": 2690.6745433807373, "eta_seconds": 7587.702212333679, "eta": "2:06:27", "timestamp": 1765139764.3068912} +{"step": 7190, "loss": 3.446274518966675, "lr": 0.00017980018381491767, "time_ms": 2690.5159950256348, "eta_seconds": 7560.349946022034, "eta": "2:06:00", "timestamp": 1765139791.2189028} +{"step": 7200, "loss": 3.291308641433716, "lr": 0.00017901791606289837, "time_ms": 2690.6518936157227, "eta_seconds": 7533.825302124023, "eta": "2:05:33", "timestamp": 1765139818.1338491} +{"step": 7210, "loss": 3.3550214767456055, "lr": 0.0001782374879799248, "time_ms": 2691.518783569336, "eta_seconds": 7509.337406158447, "eta": "2:05:09", "timestamp": 1765139845.0488987} +{"step": 7220, "loss": 3.3011016845703125, "lr": 0.00017745890907526675, "time_ms": 2691.135883331299, "eta_seconds": 7481.357755661011, "eta": "2:04:41", "timestamp": 1765139871.9632144} +{"step": 7230, "loss": 3.4803550243377686, "lr": 0.0001766821888356627, "time_ms": 2690.9759044647217, "eta_seconds": 7454.003255367279, "eta": "2:04:14", "timestamp": 1765139898.8780613} +{"step": 7240, "loss": 3.25938081741333, "lr": 0.00017590733672520346, "time_ms": 2690.915107727051, "eta_seconds": 7426.92569732666, "eta": "2:03:46", "timestamp": 1765139925.7927275} +{"step": 7250, "loss": 3.410045623779297, "lr": 0.0001751343621852176, "time_ms": 2692.6283836364746, "eta_seconds": 7404.728055000305, "eta": "2:03:24", "timestamp": 1765139952.704084} +{"step": 7260, "loss": 3.4541642665863037, "lr": 0.00017436327463415583, "time_ms": 2690.4516220092773, "eta_seconds": 7371.83744430542, "eta": "2:02:51", "timestamp": 1765139979.6159945} +{"step": 7270, "loss": 3.3238883018493652, "lr": 0.00017359408346747675, "time_ms": 2691.049814224243, "eta_seconds": 7346.565992832184, "eta": "2:02:26", "timestamp": 1765140006.5298138} +{"step": 7280, "loss": 3.5215630531311035, "lr": 0.00017282679805753187, "time_ms": 2690.7224655151367, "eta_seconds": 7318.765106201172, "eta": "2:01:58", "timestamp": 1765140033.4420207} +{"step": 7290, "loss": 3.410937547683716, "lr": 0.0001720614277534518, "time_ms": 2691.1821365356445, "eta_seconds": 7293.103590011597, "eta": "2:01:33", "timestamp": 1765140060.353301} +{"step": 7300, "loss": 3.3720624446868896, "lr": 0.00017129798188103226, "time_ms": 2690.778970718384, "eta_seconds": 7265.103220939636, "eta": "2:01:05", "timestamp": 1765140087.2620037} +{"step": 7310, "loss": 3.3123180866241455, "lr": 0.0001705364697426201, "time_ms": 2690.0556087493896, "eta_seconds": 7236.249587535858, "eta": "2:00:36", "timestamp": 1765140114.1726437} +{"step": 7320, "loss": 3.47444486618042, "lr": 0.0001697769006170006, "time_ms": 2691.086530685425, "eta_seconds": 7212.1119022369385, "eta": "2:00:12", "timestamp": 1765140141.0849643} +{"step": 7330, "loss": 3.4373276233673096, "lr": 0.0001690192837592837, "time_ms": 2690.976142883301, "eta_seconds": 7184.906301498413, "eta": "1:59:44", "timestamp": 1765140167.996844} +{"step": 7340, "loss": 3.2812440395355225, "lr": 0.00016826362840079184, "time_ms": 2690.662622451782, "eta_seconds": 7157.162575721741, "eta": "1:59:17", "timestamp": 1765140194.9082737} +{"step": 7350, "loss": 3.488464593887329, "lr": 0.00016750994374894692, "time_ms": 2690.763473510742, "eta_seconds": 7130.523204803467, "eta": "1:58:50", "timestamp": 1765140221.8200698} +{"step": 7360, "loss": 3.372711658477783, "lr": 0.0001667582389871588, "time_ms": 2690.429210662842, "eta_seconds": 7102.733116149902, "eta": "1:58:22", "timestamp": 1765140248.733195} +{"step": 7370, "loss": 3.4508445262908936, "lr": 0.00016600852327471264, "time_ms": 2691.5693283081055, "eta_seconds": 7078.827333450317, "eta": "1:57:58", "timestamp": 1765140275.6465728} +{"step": 7380, "loss": 3.4506311416625977, "lr": 0.00016526080574665774, "time_ms": 2691.171407699585, "eta_seconds": 7050.869088172913, "eta": "1:57:30", "timestamp": 1765140302.5597878} +{"step": 7390, "loss": 3.483416795730591, "lr": 0.00016451509551369638, "time_ms": 2690.142869949341, "eta_seconds": 7021.2728905677795, "eta": "1:57:01", "timestamp": 1765140329.4721122} +{"step": 7400, "loss": 3.323662042617798, "lr": 0.00016377140166207226, "time_ms": 2691.178321838379, "eta_seconds": 6997.063636779785, "eta": "1:56:37", "timestamp": 1765140356.3861651} +{"step": 7410, "loss": 3.5495169162750244, "lr": 0.00016302973325346042, "time_ms": 2690.55438041687, "eta_seconds": 6968.535845279694, "eta": "1:56:08", "timestamp": 1765140383.3018422} +{"step": 7420, "loss": 3.265690326690674, "lr": 0.0001622900993248562, "time_ms": 2691.5721893310547, "eta_seconds": 6944.256248474121, "eta": "1:55:44", "timestamp": 1765140410.2174435} +{"step": 7430, "loss": 3.27311110496521, "lr": 0.00016155250888846576, "time_ms": 2691.286087036133, "eta_seconds": 6916.605243682861, "eta": "1:55:16", "timestamp": 1765140437.131801} +{"step": 7440, "loss": 3.474173069000244, "lr": 0.00016081697093159574, "time_ms": 2691.8373107910156, "eta_seconds": 6891.103515625, "eta": "1:54:51", "timestamp": 1765140464.0454822} +{"step": 7450, "loss": 3.390735149383545, "lr": 0.0001600834944165439, "time_ms": 2691.8647289276123, "eta_seconds": 6864.255058765411, "eta": "1:54:24", "timestamp": 1765140490.9593303} +{"step": 7460, "loss": 3.4436347484588623, "lr": 0.00015935208828049023, "time_ms": 2690.653085708618, "eta_seconds": 6834.25883769989, "eta": "1:53:54", "timestamp": 1765140517.872479} +{"step": 7470, "loss": 3.391531229019165, "lr": 0.00015862276143538775, "time_ms": 2691.469192504883, "eta_seconds": 6809.4170570373535, "eta": "1:53:29", "timestamp": 1765140544.787212} +{"step": 7480, "loss": 3.4062657356262207, "lr": 0.00015789552276785376, "time_ms": 2691.530704498291, "eta_seconds": 6782.657375335693, "eta": "1:53:02", "timestamp": 1765140571.7027333} +{"step": 7490, "loss": 3.35864520072937, "lr": 0.00015717038113906195, "time_ms": 2690.7763481140137, "eta_seconds": 6753.848633766174, "eta": "1:52:33", "timestamp": 1765140598.6169944} +{"step": 7500, "loss": 3.3165578842163086, "lr": 0.00015644734538463435, "time_ms": 52860.53800582886, "eta_seconds": 132151.34501457214, "eta": "1 day, 12:42:31", "timestamp": 1765140675.701124} +{"step": 7510, "loss": 3.3213443756103516, "lr": 0.0001557264243145333, "time_ms": 2690.7448768615723, "eta_seconds": 6699.954743385315, "eta": "1:51:39", "timestamp": 1765140702.5932043} +{"step": 7520, "loss": 3.371352195739746, "lr": 0.00015500762671295465, "time_ms": 2690.690755844116, "eta_seconds": 6672.913074493408, "eta": "1:51:12", "timestamp": 1765140729.5002313} +{"step": 7530, "loss": 3.5109429359436035, "lr": 0.00015429096133822025, "time_ms": 2691.580057144165, "eta_seconds": 6648.202741146088, "eta": "1:50:48", "timestamp": 1765140756.412794} +{"step": 7540, "loss": 3.4200916290283203, "lr": 0.0001535764369226715, "time_ms": 2690.995931625366, "eta_seconds": 6619.849991798401, "eta": "1:50:19", "timestamp": 1765140783.3267214} +{"step": 7550, "loss": 3.48549485206604, "lr": 0.00015286406217256306, "time_ms": 2689.958333969116, "eta_seconds": 6590.397918224335, "eta": "1:49:50", "timestamp": 1765140810.2409973} +{"step": 7560, "loss": 3.393724203109741, "lr": 0.00015215384576795622, "time_ms": 2690.884590148926, "eta_seconds": 6565.758399963379, "eta": "1:49:25", "timestamp": 1765140837.1541073} +{"step": 7570, "loss": 3.3120131492614746, "lr": 0.00015144579636261403, "time_ms": 2691.758632659912, "eta_seconds": 6540.973477363586, "eta": "1:49:00", "timestamp": 1765140864.067697} +{"step": 7580, "loss": 3.3397738933563232, "lr": 0.00015073992258389475, "time_ms": 2690.357208251953, "eta_seconds": 6510.664443969727, "eta": "1:48:30", "timestamp": 1765140890.9801624} +{"step": 7590, "loss": 3.3119640350341797, "lr": 0.00015003623303264785, "time_ms": 2690.8910274505615, "eta_seconds": 6485.047376155853, "eta": "1:48:05", "timestamp": 1765140917.8958201} +{"step": 7600, "loss": 3.4343881607055664, "lr": 0.00014933473628310834, "time_ms": 2690.966844558716, "eta_seconds": 6458.320426940918, "eta": "1:47:38", "timestamp": 1765140944.8103833} +{"step": 7610, "loss": 3.4073452949523926, "lr": 0.00014863544088279267, "time_ms": 2690.5505657196045, "eta_seconds": 6430.415852069855, "eta": "1:47:10", "timestamp": 1765140971.72428} +{"step": 7620, "loss": 3.444519519805908, "lr": 0.00014793835535239475, "time_ms": 2690.5899047851562, "eta_seconds": 6403.603973388672, "eta": "1:46:43", "timestamp": 1765140998.6365268} +{"step": 7630, "loss": 3.4623537063598633, "lr": 0.00014724348818568163, "time_ms": 2690.2520656585693, "eta_seconds": 6375.897395610809, "eta": "1:46:15", "timestamp": 1765141025.5508633} +{"step": 7640, "loss": 3.486971855163574, "lr": 0.0001465508478493906, "time_ms": 2690.7687187194824, "eta_seconds": 6350.2141761779785, "eta": "1:45:50", "timestamp": 1765141052.4630315} +{"step": 7650, "loss": 3.3233399391174316, "lr": 0.00014586044278312542, "time_ms": 2690.946578979492, "eta_seconds": 6323.724460601807, "eta": "1:45:23", "timestamp": 1765141079.3760257} +{"step": 7660, "loss": 3.2917320728302, "lr": 0.00014517228139925402, "time_ms": 2691.3602352142334, "eta_seconds": 6297.782950401306, "eta": "1:44:57", "timestamp": 1765141106.2885172} +{"step": 7670, "loss": 3.333756446838379, "lr": 0.00014448637208280582, "time_ms": 2690.81974029541, "eta_seconds": 6269.609994888306, "eta": "1:44:29", "timestamp": 1765141133.2053807} +{"step": 7680, "loss": 3.4497272968292236, "lr": 0.00014380272319136915, "time_ms": 2690.258026123047, "eta_seconds": 6241.398620605469, "eta": "1:44:01", "timestamp": 1765141160.1226168} +{"step": 7690, "loss": 3.26739501953125, "lr": 0.0001431213430549902, "time_ms": 2690.9334659576416, "eta_seconds": 6216.056306362152, "eta": "1:43:36", "timestamp": 1765141187.036327} +{"step": 7700, "loss": 3.2567079067230225, "lr": 0.0001424422399760707, "time_ms": 2692.0411586761475, "eta_seconds": 6191.694664955139, "eta": "1:43:11", "timestamp": 1765141213.951032} +{"step": 7710, "loss": 3.347151041030884, "lr": 0.00014176542222926758, "time_ms": 2693.072557449341, "eta_seconds": 6167.1361565589905, "eta": "1:42:47", "timestamp": 1765141240.8657546} +{"step": 7720, "loss": 3.4606809616088867, "lr": 0.0001410908980613913, "time_ms": 2691.3838386535645, "eta_seconds": 6136.355152130127, "eta": "1:42:16", "timestamp": 1765141267.7831967} +{"step": 7730, "loss": 3.2836639881134033, "lr": 0.00014041867569130614, "time_ms": 2691.7901039123535, "eta_seconds": 6110.3635358810425, "eta": "1:41:50", "timestamp": 1765141294.6995118} +{"step": 7740, "loss": 3.3936939239501953, "lr": 0.0001397487633098294, "time_ms": 2690.5879974365234, "eta_seconds": 6080.728874206543, "eta": "1:41:20", "timestamp": 1765141321.6165802} +{"step": 7750, "loss": 3.562915802001953, "lr": 0.00013908116907963218, "time_ms": 2690.629482269287, "eta_seconds": 6053.916335105896, "eta": "1:40:53", "timestamp": 1765141348.5295749} +{"step": 7760, "loss": 3.35880708694458, "lr": 0.0001384159011351394, "time_ms": 2691.460609436035, "eta_seconds": 6028.871765136719, "eta": "1:40:28", "timestamp": 1765141375.4435241} +{"step": 7770, "loss": 3.366746425628662, "lr": 0.00013775296758243097, "time_ms": 2690.2525424957275, "eta_seconds": 5999.263169765472, "eta": "1:39:59", "timestamp": 1765141402.356633} +{"step": 7780, "loss": 3.409856081008911, "lr": 0.00013709237649914315, "time_ms": 2690.875291824341, "eta_seconds": 5973.743147850037, "eta": "1:39:33", "timestamp": 1765141429.268949} +{"step": 7790, "loss": 3.3415374755859375, "lr": 0.00013643413593436964, "time_ms": 2691.6069984436035, "eta_seconds": 5948.451466560364, "eta": "1:39:08", "timestamp": 1765141456.1850083} +{"step": 7800, "loss": 3.3486440181732178, "lr": 0.00013577825390856423, "time_ms": 2691.3890838623047, "eta_seconds": 5921.05598449707, "eta": "1:38:41", "timestamp": 1765141483.1036363} +{"step": 7810, "loss": 3.1951751708984375, "lr": 0.0001351247384134422, "time_ms": 2691.516399383545, "eta_seconds": 5894.420914649963, "eta": "1:38:14", "timestamp": 1765141510.0210352} +{"step": 7820, "loss": 3.3693692684173584, "lr": 0.00013447359741188382, "time_ms": 2691.084623336792, "eta_seconds": 5866.5644788742065, "eta": "1:37:46", "timestamp": 1765141536.9376667} +{"step": 7830, "loss": 3.2546303272247314, "lr": 0.0001338248388378365, "time_ms": 2691.5605068206787, "eta_seconds": 5840.686299800873, "eta": "1:37:20", "timestamp": 1765141563.8542676} +{"step": 7840, "loss": 3.4579989910125732, "lr": 0.00013317847059621894, "time_ms": 2690.566062927246, "eta_seconds": 5811.622695922852, "eta": "1:36:51", "timestamp": 1765141590.7714539} +{"step": 7850, "loss": 3.401890993118286, "lr": 0.00013253450056282395, "time_ms": 2690.831422805786, "eta_seconds": 5785.28755903244, "eta": "1:36:25", "timestamp": 1765141617.6867673} +{"step": 7860, "loss": 3.347987174987793, "lr": 0.00013189293658422333, "time_ms": 2689.586639404297, "eta_seconds": 5755.715408325195, "eta": "1:35:55", "timestamp": 1765141644.6018674} +{"step": 7870, "loss": 3.3840203285217285, "lr": 0.0001312537864776717, "time_ms": 2690.8791065216064, "eta_seconds": 5731.572496891022, "eta": "1:35:31", "timestamp": 1765141671.5174572} +{"step": 7880, "loss": 3.28843355178833, "lr": 0.00013061705803101134, "time_ms": 2691.223382949829, "eta_seconds": 5705.393571853638, "eta": "1:35:05", "timestamp": 1765141698.435167} +{"step": 7890, "loss": 3.3608944416046143, "lr": 0.00012998275900257748, "time_ms": 2691.2078857421875, "eta_seconds": 5678.448638916016, "eta": "1:34:38", "timestamp": 1765141725.3511522} +{"step": 7900, "loss": 3.3687992095947266, "lr": 0.0001293508971211035, "time_ms": 2690.704822540283, "eta_seconds": 5650.480127334595, "eta": "1:34:10", "timestamp": 1765141752.2651114} +{"step": 7910, "loss": 3.3455803394317627, "lr": 0.0001287214800856272, "time_ms": 2690.6023025512695, "eta_seconds": 5623.358812332153, "eta": "1:33:43", "timestamp": 1765141779.180939} +{"step": 7920, "loss": 3.3198509216308594, "lr": 0.00012809451556539643, "time_ms": 2691.392183303833, "eta_seconds": 5598.095741271973, "eta": "1:33:18", "timestamp": 1765141806.097743} +{"step": 7930, "loss": 3.398447275161743, "lr": 0.00012747001119977589, "time_ms": 2691.9941902160645, "eta_seconds": 5572.427973747253, "eta": "1:32:52", "timestamp": 1765141833.0136197} +{"step": 7940, "loss": 3.2872154712677, "lr": 0.00012684797459815443, "time_ms": 2691.2178993225098, "eta_seconds": 5543.90887260437, "eta": "1:32:23", "timestamp": 1765141859.9307036} +{"step": 7950, "loss": 3.2800357341766357, "lr": 0.00012622841333985153, "time_ms": 2691.1277770996094, "eta_seconds": 5516.811943054199, "eta": "1:31:56", "timestamp": 1765141886.8483515} +{"step": 7960, "loss": 3.199725866317749, "lr": 0.00012561133497402579, "time_ms": 2690.0768280029297, "eta_seconds": 5487.756729125977, "eta": "1:31:27", "timestamp": 1765141913.7641957} +{"step": 7970, "loss": 3.301370143890381, "lr": 0.00012499674701958217, "time_ms": 2690.7763481140137, "eta_seconds": 5462.275986671448, "eta": "1:31:02", "timestamp": 1765141940.679314} +{"step": 7980, "loss": 3.2861764430999756, "lr": 0.0001243846569650811, "time_ms": 2691.4966106414795, "eta_seconds": 5436.823153495789, "eta": "1:30:36", "timestamp": 1765141967.5965574} +{"step": 7990, "loss": 3.4885597229003906, "lr": 0.00012377507226864667, "time_ms": 2689.5124912261963, "eta_seconds": 5405.9201073646545, "eta": "1:30:05", "timestamp": 1765141994.511382} +{"step": 8000, "loss": 3.510509729385376, "lr": 0.00012316800035787594, "time_ms": 52807.03282356262, "eta_seconds": 105614.06564712524, "eta": "1 day, 5:20:14", "timestamp": 1765142071.5432765} +{"step": 8010, "loss": 3.4013826847076416, "lr": 0.00012256344862974873, "time_ms": 2689.6839141845703, "eta_seconds": 5352.470989227295, "eta": "1:29:12", "timestamp": 1765142098.440581} +{"step": 8020, "loss": 3.4684290885925293, "lr": 0.00012196142445053691, "time_ms": 2691.038131713867, "eta_seconds": 5328.255500793457, "eta": "1:28:48", "timestamp": 1765142125.346448} +{"step": 8030, "loss": 3.347038745880127, "lr": 0.00012136193515571521, "time_ms": 2690.9689903259277, "eta_seconds": 5301.208910942078, "eta": "1:28:21", "timestamp": 1765142152.2568727} +{"step": 8040, "loss": 3.3585739135742188, "lr": 0.00012076498804987152, "time_ms": 2691.214084625244, "eta_seconds": 5274.7796058654785, "eta": "1:27:54", "timestamp": 1765142179.1709368} +{"step": 8050, "loss": 3.3624343872070312, "lr": 0.00012017059040661784, "time_ms": 2691.6356086730957, "eta_seconds": 5248.689436912537, "eta": "1:27:28", "timestamp": 1765142206.0854137} +{"step": 8060, "loss": 3.3724749088287354, "lr": 0.00011957874946850192, "time_ms": 2690.6838417053223, "eta_seconds": 5219.926652908325, "eta": "1:26:59", "timestamp": 1765142233.0000045} +{"step": 8070, "loss": 3.2693450450897217, "lr": 0.0001189894724469189, "time_ms": 2690.4475688934326, "eta_seconds": 5192.563807964325, "eta": "1:26:32", "timestamp": 1765142259.910999} +{"step": 8080, "loss": 3.2794079780578613, "lr": 0.00011840276652202327, "time_ms": 2690.59157371521, "eta_seconds": 5165.935821533203, "eta": "1:26:05", "timestamp": 1765142286.8204944} +{"step": 8090, "loss": 3.492159366607666, "lr": 0.00011781863884264146, "time_ms": 2690.53316116333, "eta_seconds": 5138.91833782196, "eta": "1:25:38", "timestamp": 1765142313.7322109} +{"step": 8100, "loss": 3.399838924407959, "lr": 0.00011723709652618508, "time_ms": 2690.3929710388184, "eta_seconds": 5111.746644973755, "eta": "1:25:11", "timestamp": 1765142340.6437612} +{"step": 8110, "loss": 3.3023929595947266, "lr": 0.00011665814665856358, "time_ms": 2690.4168128967285, "eta_seconds": 5084.887776374817, "eta": "1:24:44", "timestamp": 1765142367.5543778} +{"step": 8120, "loss": 3.292243003845215, "lr": 0.00011608179629409853, "time_ms": 2691.1468505859375, "eta_seconds": 5059.3560791015625, "eta": "1:24:19", "timestamp": 1765142394.4649973} +{"step": 8130, "loss": 3.5050899982452393, "lr": 0.00011550805245543707, "time_ms": 2691.1561489105225, "eta_seconds": 5032.461998462677, "eta": "1:23:52", "timestamp": 1765142421.3773503} +{"step": 8140, "loss": 3.5275585651397705, "lr": 0.000114936922133467, "time_ms": 2690.9337043762207, "eta_seconds": 5005.1366901397705, "eta": "1:23:25", "timestamp": 1765142448.2886908} +{"step": 8150, "loss": 3.4321401119232178, "lr": 0.000114368412287231, "time_ms": 2691.71142578125, "eta_seconds": 4979.6661376953125, "eta": "1:22:59", "timestamp": 1765142475.201153} +{"step": 8160, "loss": 3.4114489555358887, "lr": 0.00011380252984384198, "time_ms": 2690.2613639831543, "eta_seconds": 4950.080909729004, "eta": "1:22:30", "timestamp": 1765142502.1131105} +{"step": 8170, "loss": 3.397610664367676, "lr": 0.00011323928169839912, "time_ms": 2690.804958343506, "eta_seconds": 4924.173073768616, "eta": "1:22:04", "timestamp": 1765142529.0227528} +{"step": 8180, "loss": 3.419696569442749, "lr": 0.00011267867471390319, "time_ms": 2691.0126209259033, "eta_seconds": 4897.642970085144, "eta": "1:21:37", "timestamp": 1765142555.9337213} +{"step": 8190, "loss": 3.304830551147461, "lr": 0.00011212071572117353, "time_ms": 2689.7382736206055, "eta_seconds": 4868.426275253296, "eta": "1:21:08", "timestamp": 1765142582.8464813} +{"step": 8200, "loss": 3.3216350078582764, "lr": 0.00011156541151876421, "time_ms": 2690.6561851501465, "eta_seconds": 4843.181133270264, "eta": "1:20:43", "timestamp": 1765142609.757757} +{"step": 8210, "loss": 3.3689510822296143, "lr": 0.00011101276887288185, "time_ms": 2689.540147781372, "eta_seconds": 4814.276864528656, "eta": "1:20:14", "timestamp": 1765142636.667398} +{"step": 8220, "loss": 3.364605188369751, "lr": 0.00011046279451730255, "time_ms": 2690.5579566955566, "eta_seconds": 4789.193162918091, "eta": "1:19:49", "timestamp": 1765142663.5756533} +{"step": 8230, "loss": 3.242360830307007, "lr": 0.00010991549515329033, "time_ms": 2690.559148788452, "eta_seconds": 4762.28969335556, "eta": "1:19:22", "timestamp": 1765142690.485409} +{"step": 8240, "loss": 3.3352532386779785, "lr": 0.0001093708774495153, "time_ms": 2689.6748542785645, "eta_seconds": 4733.827743530273, "eta": "1:18:53", "timestamp": 1765142717.3959346} +{"step": 8250, "loss": 3.3154122829437256, "lr": 0.00010882894804197218, "time_ms": 2690.901517868042, "eta_seconds": 4709.0776562690735, "eta": "1:18:29", "timestamp": 1765142744.307486} +{"step": 8260, "loss": 3.231806755065918, "lr": 0.0001082897135338999, "time_ms": 2689.7101402282715, "eta_seconds": 4680.095643997192, "eta": "1:18:00", "timestamp": 1765142771.2158332} +{"step": 8270, "loss": 3.411125421524048, "lr": 0.00010775318049570067, "time_ms": 2690.6166076660156, "eta_seconds": 4654.766731262207, "eta": "1:17:34", "timestamp": 1765142798.1254163} +{"step": 8280, "loss": 3.2329282760620117, "lr": 0.00010721935546486032, "time_ms": 2689.7847652435303, "eta_seconds": 4626.429796218872, "eta": "1:17:06", "timestamp": 1765142825.0338764} +{"step": 8290, "loss": 3.315493583679199, "lr": 0.00010668824494586827, "time_ms": 2691.032648086548, "eta_seconds": 4601.665828227997, "eta": "1:16:41", "timestamp": 1765142851.943724} +{"step": 8300, "loss": 3.3229782581329346, "lr": 0.00010615985541013876, "time_ms": 2689.962387084961, "eta_seconds": 4572.936058044434, "eta": "1:16:12", "timestamp": 1765142878.8539932} +{"step": 8310, "loss": 3.3469886779785156, "lr": 0.00010563419329593141, "time_ms": 2690.593481063843, "eta_seconds": 4547.102982997894, "eta": "1:15:47", "timestamp": 1765142905.7643256} +{"step": 8320, "loss": 3.349055051803589, "lr": 0.00010511126500827316, "time_ms": 2691.2500858306885, "eta_seconds": 4521.300144195557, "eta": "1:15:21", "timestamp": 1765142932.6780229} +{"step": 8330, "loss": 3.3976316452026367, "lr": 0.00010459107691888026, "time_ms": 2689.7189617156982, "eta_seconds": 4491.830666065216, "eta": "1:14:51", "timestamp": 1765142959.5886538} +{"step": 8340, "loss": 3.4126346111297607, "lr": 0.00010407363536608035, "time_ms": 2691.0805702209473, "eta_seconds": 4467.1937465667725, "eta": "1:14:27", "timestamp": 1765142986.497959} +{"step": 8350, "loss": 3.4419100284576416, "lr": 0.00010355894665473553, "time_ms": 2691.6825771331787, "eta_seconds": 4441.276252269745, "eta": "1:14:01", "timestamp": 1765143013.4111288} +{"step": 8360, "loss": 3.361856698989868, "lr": 0.00010304701705616525, "time_ms": 2690.382242202759, "eta_seconds": 4412.226877212524, "eta": "1:13:32", "timestamp": 1765143040.3209908} +{"step": 8370, "loss": 3.377951145172119, "lr": 0.00010253785280807019, "time_ms": 2690.328359603882, "eta_seconds": 4385.235226154327, "eta": "1:13:05", "timestamp": 1765143067.229381} +{"step": 8380, "loss": 3.4571197032928467, "lr": 0.00010203146011445599, "time_ms": 2689.945697784424, "eta_seconds": 4357.712030410767, "eta": "1:12:37", "timestamp": 1765143094.1393497} +{"step": 8390, "loss": 3.190080165863037, "lr": 0.00010152784514555775, "time_ms": 2691.4730072021484, "eta_seconds": 4333.271541595459, "eta": "1:12:13", "timestamp": 1765143121.0503879} +{"step": 8400, "loss": 3.383554697036743, "lr": 0.00010102701403776499, "time_ms": 2689.9354457855225, "eta_seconds": 4303.896713256836, "eta": "1:11:43", "timestamp": 1765143147.958026} +{"step": 8410, "loss": 3.3776726722717285, "lr": 0.00010052897289354677, "time_ms": 2690.4377937316895, "eta_seconds": 4277.796092033386, "eta": "1:11:17", "timestamp": 1765143174.867733} +{"step": 8420, "loss": 3.410266160964966, "lr": 0.00010003372778137712, "time_ms": 2690.28902053833, "eta_seconds": 4250.6566524505615, "eta": "1:10:50", "timestamp": 1765143201.7803087} +{"step": 8430, "loss": 3.374704122543335, "lr": 9.954128473566155e-05, "time_ms": 2691.314220428467, "eta_seconds": 4225.363326072693, "eta": "1:10:25", "timestamp": 1765143228.6917434} +{"step": 8440, "loss": 3.365989923477173, "lr": 9.905164975666321e-05, "time_ms": 2690.842866897583, "eta_seconds": 4197.7148723602295, "eta": "1:09:57", "timestamp": 1765143255.6011415} +{"step": 8450, "loss": 3.3367154598236084, "lr": 9.85648288104297e-05, "time_ms": 2690.8199787139893, "eta_seconds": 4170.770967006683, "eta": "1:09:30", "timestamp": 1765143282.5096643} +{"step": 8460, "loss": 3.393660306930542, "lr": 9.80808278287206e-05, "time_ms": 2690.160036087036, "eta_seconds": 4142.846455574036, "eta": "1:09:02", "timestamp": 1765143309.4169624} +{"step": 8470, "loss": 3.34236478805542, "lr": 9.759965270893524e-05, "time_ms": 2689.990282058716, "eta_seconds": 4115.685131549835, "eta": "1:08:35", "timestamp": 1765143336.3290691} +{"step": 8480, "loss": 3.288980722427368, "lr": 9.712130931404048e-05, "time_ms": 2690.6702518463135, "eta_seconds": 4089.8187828063965, "eta": "1:08:09", "timestamp": 1765143363.239859} +{"step": 8490, "loss": 3.38795804977417, "lr": 9.664580347249974e-05, "time_ms": 2689.586400985718, "eta_seconds": 4061.275465488434, "eta": "1:07:41", "timestamp": 1765143390.151873} +{"step": 8500, "loss": 3.3587489128112793, "lr": 9.617314097820154e-05, "time_ms": 50056.7889213562, "eta_seconds": 75085.1833820343, "eta": "20:51:25", "timestamp": 1765143464.4278038} +{"step": 8510, "loss": 3.409309148788452, "lr": 9.570332759038935e-05, "time_ms": 2690.657615661621, "eta_seconds": 4009.0798473358154, "eta": "1:06:49", "timestamp": 1765143491.3384542} +{"step": 8520, "loss": 3.4744555950164795, "lr": 9.523636903359086e-05, "time_ms": 2690.35005569458, "eta_seconds": 3981.7180824279785, "eta": "1:06:21", "timestamp": 1765143518.249051} +{"step": 8530, "loss": 3.303799867630005, "lr": 9.477227099754886e-05, "time_ms": 2689.422845840454, "eta_seconds": 3953.4515833854675, "eta": "1:05:53", "timestamp": 1765143545.1568255} +{"step": 8540, "loss": 3.3909847736358643, "lr": 9.431103913715142e-05, "time_ms": 2689.4264221191406, "eta_seconds": 3926.5625762939453, "eta": "1:05:26", "timestamp": 1765143572.0661223} +{"step": 8550, "loss": 3.2989492416381836, "lr": 9.385267907236314e-05, "time_ms": 2688.6818408966064, "eta_seconds": 3898.5886693000793, "eta": "1:04:58", "timestamp": 1765143598.967236} +{"step": 8560, "loss": 3.243168830871582, "lr": 9.339719638815689e-05, "time_ms": 2690.2079582214355, "eta_seconds": 3873.899459838867, "eta": "1:04:33", "timestamp": 1765143625.8752072} +{"step": 8570, "loss": 3.3418707847595215, "lr": 9.294459663444524e-05, "time_ms": 2690.1533603668213, "eta_seconds": 3846.9193053245544, "eta": "1:04:06", "timestamp": 1765143652.7832148} +{"step": 8580, "loss": 3.260011911392212, "lr": 9.249488532601358e-05, "time_ms": 2691.0927295684814, "eta_seconds": 3821.3516759872437, "eta": "1:03:41", "timestamp": 1765143679.6961155} +{"step": 8590, "loss": 3.4200499057769775, "lr": 9.20480679424521e-05, "time_ms": 2691.0765171051025, "eta_seconds": 3794.4178891181946, "eta": "1:03:14", "timestamp": 1765143706.6072495} +{"step": 8600, "loss": 3.4440009593963623, "lr": 9.16041499280897e-05, "time_ms": 2690.5856132507324, "eta_seconds": 3766.8198585510254, "eta": "1:02:46", "timestamp": 1765143733.5198185} +{"step": 8610, "loss": 3.3442983627319336, "lr": 9.116313669192733e-05, "time_ms": 2690.6862258911133, "eta_seconds": 3740.0538539886475, "eta": "1:02:20", "timestamp": 1765143760.4321253} +{"step": 8620, "loss": 3.365971565246582, "lr": 9.072503360757202e-05, "time_ms": 2692.046642303467, "eta_seconds": 3715.024366378784, "eta": "1:01:55", "timestamp": 1765143787.347133} +{"step": 8630, "loss": 3.153622627258301, "lr": 9.028984601317166e-05, "time_ms": 2690.237283706665, "eta_seconds": 3685.625078678131, "eta": "1:01:25", "timestamp": 1765143814.262085} +{"step": 8640, "loss": 3.3887555599212646, "lr": 8.985757921134966e-05, "time_ms": 2690.73748588562, "eta_seconds": 3659.4029808044434, "eta": "1:00:59", "timestamp": 1765143841.1750631} +{"step": 8650, "loss": 3.486097574234009, "lr": 8.942823846914069e-05, "time_ms": 2690.1230812072754, "eta_seconds": 3631.666159629822, "eta": "1:00:31", "timestamp": 1765143868.087896} +{"step": 8660, "loss": 3.2878191471099854, "lr": 8.900182901792608e-05, "time_ms": 2691.7150020599365, "eta_seconds": 3606.898102760315, "eta": "1:00:06", "timestamp": 1765143895.0026808} +{"step": 8670, "loss": 3.3771045207977295, "lr": 8.85783560533706e-05, "time_ms": 2691.115140914917, "eta_seconds": 3579.1831374168396, "eta": "0:59:39", "timestamp": 1765143921.9144099} +{"step": 8680, "loss": 3.2994155883789062, "lr": 8.815782473535851e-05, "time_ms": 2690.5598640441895, "eta_seconds": 3551.53902053833, "eta": "0:59:11", "timestamp": 1765143948.8260663} +{"step": 8690, "loss": 3.3699631690979004, "lr": 8.774024018793134e-05, "time_ms": 2690.713882446289, "eta_seconds": 3524.8351860046387, "eta": "0:58:44", "timestamp": 1765143975.7416425} +{"step": 8700, "loss": 3.4374184608459473, "lr": 8.732560749922495e-05, "time_ms": 2690.570831298828, "eta_seconds": 3497.7420806884766, "eta": "0:58:17", "timestamp": 1765144002.6519482} +{"step": 8710, "loss": 3.3896124362945557, "lr": 8.691393172140775e-05, "time_ms": 2689.120292663574, "eta_seconds": 3468.9651775360107, "eta": "0:57:48", "timestamp": 1765144029.5562959} +{"step": 8720, "loss": 3.2293946743011475, "lr": 8.65052178706193e-05, "time_ms": 2689.6586418151855, "eta_seconds": 3442.7630615234375, "eta": "0:57:22", "timestamp": 1765144056.453786} +{"step": 8730, "loss": 3.2661988735198975, "lr": 8.609947092690877e-05, "time_ms": 2691.1773681640625, "eta_seconds": 3417.7952575683594, "eta": "0:56:57", "timestamp": 1765144083.3631487} +{"step": 8740, "loss": 3.2970285415649414, "lr": 8.569669583417477e-05, "time_ms": 2691.1985874176025, "eta_seconds": 3390.910220146179, "eta": "0:56:30", "timestamp": 1765144110.2750328} +{"step": 8750, "loss": 3.466867208480835, "lr": 8.529689750010451e-05, "time_ms": 2691.352605819702, "eta_seconds": 3364.1907572746277, "eta": "0:56:04", "timestamp": 1765144137.1897147} +{"step": 8760, "loss": 3.0660409927368164, "lr": 8.490008079611468e-05, "time_ms": 2691.3857460021973, "eta_seconds": 3337.3183250427246, "eta": "0:55:37", "timestamp": 1765144164.1041923} +{"step": 8770, "loss": 3.3840668201446533, "lr": 8.45062505572915e-05, "time_ms": 2690.1464462280273, "eta_seconds": 3308.8801288604736, "eta": "0:55:08", "timestamp": 1765144191.018715} +{"step": 8780, "loss": 3.2500574588775635, "lr": 8.41154115823322e-05, "time_ms": 2691.279888153076, "eta_seconds": 3283.361463546753, "eta": "0:54:43", "timestamp": 1765144217.9304605} +{"step": 8790, "loss": 3.2973031997680664, "lr": 8.372756863348629e-05, "time_ms": 2691.8017864227295, "eta_seconds": 3257.0801615715027, "eta": "0:54:17", "timestamp": 1765144244.8447702} +{"step": 8800, "loss": 3.350229263305664, "lr": 8.334272643649774e-05, "time_ms": 2690.011739730835, "eta_seconds": 3228.014087677002, "eta": "0:53:48", "timestamp": 1765144271.7606108} +{"step": 8810, "loss": 3.306692361831665, "lr": 8.296088968054731e-05, "time_ms": 2690.187454223633, "eta_seconds": 3201.323070526123, "eta": "0:53:21", "timestamp": 1765144298.6739902} +{"step": 8820, "loss": 3.2704901695251465, "lr": 8.258206301819529e-05, "time_ms": 2690.011739730835, "eta_seconds": 3174.2138528823853, "eta": "0:52:54", "timestamp": 1765144325.5879424} +{"step": 8830, "loss": 3.3559107780456543, "lr": 8.220625106532508e-05, "time_ms": 2691.0314559936523, "eta_seconds": 3148.5068035125732, "eta": "0:52:28", "timestamp": 1765144352.4996324} +{"step": 8840, "loss": 3.190155029296875, "lr": 8.183345840108672e-05, "time_ms": 2691.0266876220703, "eta_seconds": 3121.5909576416016, "eta": "0:52:01", "timestamp": 1765144379.4140732} +{"step": 8850, "loss": 3.448669195175171, "lr": 8.14636895678411e-05, "time_ms": 2690.8040046691895, "eta_seconds": 3094.424605369568, "eta": "0:51:34", "timestamp": 1765144406.3291774} +{"step": 8860, "loss": 3.294142007827759, "lr": 8.109694907110489e-05, "time_ms": 2690.7005310058594, "eta_seconds": 3067.3986053466797, "eta": "0:51:07", "timestamp": 1765144433.241375} +{"step": 8870, "loss": 3.3672802448272705, "lr": 8.073324137949516e-05, "time_ms": 2690.0577545166016, "eta_seconds": 3039.7652626037598, "eta": "0:50:39", "timestamp": 1765144460.1525671} +{"step": 8880, "loss": 3.327383279800415, "lr": 8.037257092467548e-05, "time_ms": 2690.9737586975098, "eta_seconds": 3013.890609741211, "eta": "0:50:13", "timestamp": 1765144487.0630734} +{"step": 8890, "loss": 3.3358213901519775, "lr": 8.001494210130143e-05, "time_ms": 2690.3278827667236, "eta_seconds": 2986.2639498710632, "eta": "0:49:46", "timestamp": 1765144513.9756875} +{"step": 8900, "loss": 3.2487611770629883, "lr": 7.966035926696742e-05, "time_ms": 2690.4070377349854, "eta_seconds": 2959.447741508484, "eta": "0:49:19", "timestamp": 1765144540.8874497} +{"step": 8910, "loss": 3.3701391220092773, "lr": 7.930882674215335e-05, "time_ms": 2689.4524097442627, "eta_seconds": 2931.5031266212463, "eta": "0:48:51", "timestamp": 1765144567.7989552} +{"step": 8920, "loss": 3.3464550971984863, "lr": 7.896034881017214e-05, "time_ms": 2690.3719902038574, "eta_seconds": 2905.601749420166, "eta": "0:48:25", "timestamp": 1765144594.7102695} +{"step": 8930, "loss": 3.287585973739624, "lr": 7.86149297171174e-05, "time_ms": 2690.749406814575, "eta_seconds": 2879.1018652915955, "eta": "0:47:59", "timestamp": 1765144621.6255114} +{"step": 8940, "loss": 3.3739752769470215, "lr": 7.827257367181171e-05, "time_ms": 2690.541982650757, "eta_seconds": 2851.9745016098022, "eta": "0:47:31", "timestamp": 1765144648.537869} +{"step": 8950, "loss": 3.35949969291687, "lr": 7.793328484575556e-05, "time_ms": 2689.65482711792, "eta_seconds": 2824.137568473816, "eta": "0:47:04", "timestamp": 1765144675.4492328} +{"step": 8960, "loss": 3.350524425506592, "lr": 7.759706737307611e-05, "time_ms": 2690.2449131011963, "eta_seconds": 2797.854709625244, "eta": "0:46:37", "timestamp": 1765144702.3602793} +{"step": 8970, "loss": 3.3846492767333984, "lr": 7.726392535047721e-05, "time_ms": 2689.9728775024414, "eta_seconds": 2770.6720638275146, "eta": "0:46:10", "timestamp": 1765144729.2705336} +{"step": 8980, "loss": 3.2283291816711426, "lr": 7.69338628371893e-05, "time_ms": 2690.236806869507, "eta_seconds": 2744.041543006897, "eta": "0:45:44", "timestamp": 1765144756.1815174} +{"step": 8990, "loss": 3.3537302017211914, "lr": 7.66068838549199e-05, "time_ms": 2690.2143955230713, "eta_seconds": 2717.116539478302, "eta": "0:45:17", "timestamp": 1765144783.0938842} +{"step": 9000, "loss": 3.238189220428467, "lr": 7.628299238780476e-05, "time_ms": 50151.429891586304, "eta_seconds": 50151.429891586304, "eta": "13:55:51", "timestamp": 1765144857.4694958} +{"step": 9010, "loss": 3.321075201034546, "lr": 7.596219238235912e-05, "time_ms": 2690.6301975250244, "eta_seconds": 2663.723895549774, "eta": "0:44:23", "timestamp": 1765144884.3811572} +{"step": 9020, "loss": 3.368441581726074, "lr": 7.56444877474299e-05, "time_ms": 2690.4261112213135, "eta_seconds": 2636.617588996887, "eta": "0:43:56", "timestamp": 1765144911.292855} +{"step": 9030, "loss": 3.233717679977417, "lr": 7.532988235414774e-05, "time_ms": 2691.530704498291, "eta_seconds": 2610.7847833633423, "eta": "0:43:30", "timestamp": 1765144938.2058027} +{"step": 9040, "loss": 3.0437161922454834, "lr": 7.501838003588013e-05, "time_ms": 2690.9141540527344, "eta_seconds": 2583.277587890625, "eta": "0:43:03", "timestamp": 1765144965.1212626} +{"step": 9050, "loss": 3.3927624225616455, "lr": 7.470998458818445e-05, "time_ms": 2690.71626663208, "eta_seconds": 2556.180453300476, "eta": "0:42:36", "timestamp": 1765144992.0339315} +{"step": 9060, "loss": 3.1412177085876465, "lr": 7.440469976876201e-05, "time_ms": 2690.9077167510986, "eta_seconds": 2529.4532537460327, "eta": "0:42:09", "timestamp": 1765145018.9474924} +{"step": 9070, "loss": 3.400611162185669, "lr": 7.410252929741189e-05, "time_ms": 2691.2190914154053, "eta_seconds": 2502.833755016327, "eta": "0:41:42", "timestamp": 1765145045.8587904} +{"step": 9080, "loss": 3.325889825820923, "lr": 7.380347685598593e-05, "time_ms": 2691.059350967407, "eta_seconds": 2475.7746028900146, "eta": "0:41:15", "timestamp": 1765145072.774267} +{"step": 9090, "loss": 3.3158247470855713, "lr": 7.350754608834386e-05, "time_ms": 2690.5198097229004, "eta_seconds": 2448.3730268478394, "eta": "0:40:48", "timestamp": 1765145099.685419} +{"step": 9100, "loss": 3.1698713302612305, "lr": 7.321474060030854e-05, "time_ms": 2690.671920776367, "eta_seconds": 2421.6047286987305, "eta": "0:40:21", "timestamp": 1765145126.5987024} +{"step": 9110, "loss": 3.3236937522888184, "lr": 7.292506395962258e-05, "time_ms": 2691.5459632873535, "eta_seconds": 2395.4759073257446, "eta": "0:39:55", "timestamp": 1765145153.5127046} +{"step": 9120, "loss": 3.3959319591522217, "lr": 7.263851969590433e-05, "time_ms": 2690.4077529907227, "eta_seconds": 2367.558822631836, "eta": "0:39:27", "timestamp": 1765145180.424076} +{"step": 9130, "loss": 3.1804773807525635, "lr": 7.235511130060526e-05, "time_ms": 2691.3211345672607, "eta_seconds": 2341.449387073517, "eta": "0:39:01", "timestamp": 1765145207.338237} +{"step": 9140, "loss": 3.4528889656066895, "lr": 7.207484222696722e-05, "time_ms": 2691.3883686065674, "eta_seconds": 2314.593997001648, "eta": "0:38:34", "timestamp": 1765145234.2524323} +{"step": 9150, "loss": 3.412187099456787, "lr": 7.179771588998042e-05, "time_ms": 2691.922187805176, "eta_seconds": 2288.1338596343994, "eta": "0:38:08", "timestamp": 1765145261.1690712} +{"step": 9160, "loss": 3.291551113128662, "lr": 7.152373566634185e-05, "time_ms": 2692.4338340759277, "eta_seconds": 2261.6444206237793, "eta": "0:37:41", "timestamp": 1765145288.083003} +{"step": 9170, "loss": 3.3227102756500244, "lr": 7.125290489441403e-05, "time_ms": 2691.3366317749023, "eta_seconds": 2233.809404373169, "eta": "0:37:13", "timestamp": 1765145314.9997158} +{"step": 9180, "loss": 3.497157096862793, "lr": 7.098522687418448e-05, "time_ms": 2690.047264099121, "eta_seconds": 2205.8387565612793, "eta": "0:36:45", "timestamp": 1765145341.9133205} +{"step": 9190, "loss": 3.3776609897613525, "lr": 7.072070486722538e-05, "time_ms": 2690.613031387329, "eta_seconds": 2179.3965554237366, "eta": "0:36:19", "timestamp": 1765145368.8254082} +{"step": 9200, "loss": 3.4541120529174805, "lr": 7.04593420966539e-05, "time_ms": 2690.265893936157, "eta_seconds": 2152.212715148926, "eta": "0:35:52", "timestamp": 1765145395.736828} +{"step": 9210, "loss": 3.3831913471221924, "lr": 7.020114174709295e-05, "time_ms": 2690.6821727752686, "eta_seconds": 2125.638916492462, "eta": "0:35:25", "timestamp": 1765145422.6455042} +{"step": 9220, "loss": 3.3052053451538086, "lr": 6.994610696463231e-05, "time_ms": 2689.974069595337, "eta_seconds": 2098.179774284363, "eta": "0:34:58", "timestamp": 1765145449.5568812} +{"step": 9230, "loss": 3.3486926555633545, "lr": 6.96942408567903e-05, "time_ms": 2691.2832260131836, "eta_seconds": 2072.2880840301514, "eta": "0:34:32", "timestamp": 1765145476.4681933} +{"step": 9240, "loss": 3.3560941219329834, "lr": 6.944554649247592e-05, "time_ms": 2691.5979385375977, "eta_seconds": 2045.6144332885742, "eta": "0:34:05", "timestamp": 1765145503.378264} +{"step": 9250, "loss": 3.4633677005767822, "lr": 6.920002690195159e-05, "time_ms": 2689.979314804077, "eta_seconds": 2017.4844861030579, "eta": "0:33:37", "timestamp": 1765145530.2871575} +{"step": 9260, "loss": 3.3973076343536377, "lr": 6.895768507679596e-05, "time_ms": 2691.4148330688477, "eta_seconds": 1991.6469764709473, "eta": "0:33:11", "timestamp": 1765145557.2008674} +{"step": 9270, "loss": 3.443970203399658, "lr": 6.87185239698678e-05, "time_ms": 2689.2895698547363, "eta_seconds": 1963.1813859939575, "eta": "0:32:43", "timestamp": 1765145584.1106727} +{"step": 9280, "loss": 3.5234930515289307, "lr": 6.848254649526961e-05, "time_ms": 2691.1725997924805, "eta_seconds": 1937.644271850586, "eta": "0:32:17", "timestamp": 1765145611.019961} +{"step": 9290, "loss": 3.394359588623047, "lr": 6.824975552831251e-05, "time_ms": 2690.337657928467, "eta_seconds": 1910.1397371292114, "eta": "0:31:50", "timestamp": 1765145637.9292974} +{"step": 9300, "loss": 3.097745656967163, "lr": 6.802015390548096e-05, "time_ms": 2690.8953189849854, "eta_seconds": 1883.6267232894897, "eta": "0:31:23", "timestamp": 1765145664.841099} +{"step": 9310, "loss": 3.4809844493865967, "lr": 6.779374442439828e-05, "time_ms": 2690.831184387207, "eta_seconds": 1856.6735172271729, "eta": "0:30:56", "timestamp": 1765145691.754142} +{"step": 9320, "loss": 3.298445224761963, "lr": 6.757052984379253e-05, "time_ms": 2690.5364990234375, "eta_seconds": 1829.5648193359375, "eta": "0:30:29", "timestamp": 1765145718.6680684} +{"step": 9330, "loss": 3.285349130630493, "lr": 6.735051288346295e-05, "time_ms": 2690.944194793701, "eta_seconds": 1802.9326105117798, "eta": "0:30:02", "timestamp": 1765145745.5792248} +{"step": 9340, "loss": 3.2319021224975586, "lr": 6.713369622424672e-05, "time_ms": 2691.387414932251, "eta_seconds": 1776.3156938552856, "eta": "0:29:36", "timestamp": 1765145772.4948668} +{"step": 9350, "loss": 3.4492931365966797, "lr": 6.692008250798652e-05, "time_ms": 2691.1263465881348, "eta_seconds": 1749.2321252822876, "eta": "0:29:09", "timestamp": 1765145799.4110487} +{"step": 9360, "loss": 3.269191265106201, "lr": 6.670967433749792e-05, "time_ms": 2690.7882690429688, "eta_seconds": 1722.1044921875, "eta": "0:28:42", "timestamp": 1765145826.3243115} +{"step": 9370, "loss": 3.2780473232269287, "lr": 6.650247427653819e-05, "time_ms": 2690.3634071350098, "eta_seconds": 1694.9289464950562, "eta": "0:28:14", "timestamp": 1765145853.23687} +{"step": 9380, "loss": 3.2713801860809326, "lr": 6.629848484977466e-05, "time_ms": 2688.443183898926, "eta_seconds": 1666.834774017334, "eta": "0:27:46", "timestamp": 1765145880.1465743} +{"step": 9390, "loss": 3.4110066890716553, "lr": 6.609770854275412e-05, "time_ms": 2689.96262550354, "eta_seconds": 1640.8772015571594, "eta": "0:27:20", "timestamp": 1765145907.0601888} +{"step": 9400, "loss": 3.482130527496338, "lr": 6.590014780187247e-05, "time_ms": 2692.415952682495, "eta_seconds": 1615.449571609497, "eta": "0:26:55", "timestamp": 1765145933.9713614} +{"step": 9410, "loss": 3.3858838081359863, "lr": 6.570580503434505e-05, "time_ms": 2690.715551376343, "eta_seconds": 1587.5221753120422, "eta": "0:26:27", "timestamp": 1765145960.879309} +{"step": 9420, "loss": 3.330615758895874, "lr": 6.55146826081771e-05, "time_ms": 2690.448999404907, "eta_seconds": 1560.4604196548462, "eta": "0:26:00", "timestamp": 1765145987.7938142} +{"step": 9430, "loss": 3.3212339878082275, "lr": 6.532678285213513e-05, "time_ms": 2689.3038749694824, "eta_seconds": 1532.903208732605, "eta": "0:25:32", "timestamp": 1765146014.704986} +{"step": 9440, "loss": 3.349790096282959, "lr": 6.514210805571828e-05, "time_ms": 2690.1302337646484, "eta_seconds": 1506.4729309082031, "eta": "0:25:06", "timestamp": 1765146041.6152415} +{"step": 9450, "loss": 3.267841100692749, "lr": 6.496066046913072e-05, "time_ms": 2690.500259399414, "eta_seconds": 1479.7751426696777, "eta": "0:24:39", "timestamp": 1765146068.526422} +{"step": 9460, "loss": 3.396723985671997, "lr": 6.478244230325407e-05, "time_ms": 2690.5646324157715, "eta_seconds": 1452.9049015045166, "eta": "0:24:12", "timestamp": 1765146095.440053} +{"step": 9470, "loss": 3.2867977619171143, "lr": 6.460745572962038e-05, "time_ms": 2690.4075145721436, "eta_seconds": 1425.915982723236, "eta": "0:23:45", "timestamp": 1765146122.3517492} +{"step": 9480, "loss": 3.4188685417175293, "lr": 6.443570288038583e-05, "time_ms": 2692.270040512085, "eta_seconds": 1399.9804210662842, "eta": "0:23:19", "timestamp": 1765146149.2700443} +{"step": 9490, "loss": 3.0679399967193604, "lr": 6.42671858483047e-05, "time_ms": 2689.9805068969727, "eta_seconds": 1371.890058517456, "eta": "0:22:51", "timestamp": 1765146176.1795604} +{"step": 9500, "loss": 3.324418544769287, "lr": 6.410190668670384e-05, "time_ms": 52776.08513832092, "eta_seconds": 26388.04256916046, "eta": "7:19:48", "timestamp": 1765146253.1828957} +{"step": 9510, "loss": 3.340278387069702, "lr": 6.393986740945768e-05, "time_ms": 2687.2103214263916, "eta_seconds": 1316.7330574989319, "eta": "0:21:56", "timestamp": 1765146280.0550935} +{"step": 9520, "loss": 3.484975814819336, "lr": 6.378106999096369e-05, "time_ms": 2688.401460647583, "eta_seconds": 1290.4327011108398, "eta": "0:21:30", "timestamp": 1765146306.9392776} +{"step": 9530, "loss": 3.2023866176605225, "lr": 6.362551636611827e-05, "time_ms": 2689.185380935669, "eta_seconds": 1263.9171290397644, "eta": "0:21:03", "timestamp": 1765146333.8260663} +{"step": 9540, "loss": 3.3591413497924805, "lr": 6.347320843029327e-05, "time_ms": 2688.9917850494385, "eta_seconds": 1236.9362211227417, "eta": "0:20:36", "timestamp": 1765146360.7175539} +{"step": 9550, "loss": 3.2357943058013916, "lr": 6.332414803931283e-05, "time_ms": 2689.65220451355, "eta_seconds": 1210.3434920310974, "eta": "0:20:10", "timestamp": 1765146387.6077816} +{"step": 9560, "loss": 3.350475549697876, "lr": 6.317833700943075e-05, "time_ms": 2689.3861293792725, "eta_seconds": 1183.3298969268799, "eta": "0:19:43", "timestamp": 1765146414.499476} +{"step": 9570, "loss": 3.3136377334594727, "lr": 6.303577711730843e-05, "time_ms": 2689.45574760437, "eta_seconds": 1156.4659714698792, "eta": "0:19:16", "timestamp": 1765146441.391204} +{"step": 9580, "loss": 3.4145419597625732, "lr": 6.289647009999316e-05, "time_ms": 2688.781499862671, "eta_seconds": 1129.2882299423218, "eta": "0:18:49", "timestamp": 1765146468.2880764} +{"step": 9590, "loss": 3.3090322017669678, "lr": 6.276041765489697e-05, "time_ms": 2689.6684169769287, "eta_seconds": 1102.7640509605408, "eta": "0:18:22", "timestamp": 1765146495.1817966} +{"step": 9600, "loss": 3.3046224117279053, "lr": 6.2627621439776e-05, "time_ms": 2688.9405250549316, "eta_seconds": 1075.5762100219727, "eta": "0:17:55", "timestamp": 1765146522.0760531} +{"step": 9610, "loss": 3.4344797134399414, "lr": 6.249808307271023e-05, "time_ms": 2688.852310180664, "eta_seconds": 1048.652400970459, "eta": "0:17:28", "timestamp": 1765146548.9710443} +{"step": 9620, "loss": 3.264498710632324, "lr": 6.237180413208375e-05, "time_ms": 2688.2786750793457, "eta_seconds": 1021.5458965301514, "eta": "0:17:01", "timestamp": 1765146575.8618126} +{"step": 9630, "loss": 3.2657411098480225, "lr": 6.224878615656559e-05, "time_ms": 2689.856767654419, "eta_seconds": 995.247004032135, "eta": "0:16:35", "timestamp": 1765146602.7580612} +{"step": 9640, "loss": 3.3627946376800537, "lr": 6.2129030645091e-05, "time_ms": 2689.2547607421875, "eta_seconds": 968.1317138671875, "eta": "0:16:08", "timestamp": 1765146629.6517048} +{"step": 9650, "loss": 3.338411569595337, "lr": 6.201253905684307e-05, "time_ms": 2688.350200653076, "eta_seconds": 940.9225702285767, "eta": "0:15:40", "timestamp": 1765146656.5476153} +{"step": 9660, "loss": 3.272153615951538, "lr": 6.189931281123503e-05, "time_ms": 2688.8375282287598, "eta_seconds": 914.2047595977783, "eta": "0:15:14", "timestamp": 1765146683.4454076} +{"step": 9670, "loss": 3.3755619525909424, "lr": 6.178935328789296e-05, "time_ms": 2689.8062229156494, "eta_seconds": 887.6360535621643, "eta": "0:14:47", "timestamp": 1765146710.3408399} +{"step": 9680, "loss": 3.3868374824523926, "lr": 6.168266182663898e-05, "time_ms": 2688.807725906372, "eta_seconds": 860.4184722900391, "eta": "0:14:20", "timestamp": 1765146737.2336738} +{"step": 9690, "loss": 3.292916774749756, "lr": 6.157923972747485e-05, "time_ms": 2688.793897628784, "eta_seconds": 833.5261082649231, "eta": "0:13:53", "timestamp": 1765146764.1257758} +{"step": 9700, "loss": 3.240556478500366, "lr": 6.147908825056621e-05, "time_ms": 2688.258171081543, "eta_seconds": 806.4774513244629, "eta": "0:13:26", "timestamp": 1765146791.0214467} +{"step": 9710, "loss": 3.2629811763763428, "lr": 6.138220861622719e-05, "time_ms": 2688.965082168579, "eta_seconds": 779.7998738288879, "eta": "0:12:59", "timestamp": 1765146817.9157} +{"step": 9720, "loss": 3.2918541431427, "lr": 6.128860200490559e-05, "time_ms": 2689.4314289093018, "eta_seconds": 753.0408000946045, "eta": "0:12:33", "timestamp": 1765146844.8130531} +{"step": 9730, "loss": 3.195098400115967, "lr": 6.119826955716841e-05, "time_ms": 2688.084602355957, "eta_seconds": 725.7828426361084, "eta": "0:12:05", "timestamp": 1765146871.7054849} +{"step": 9740, "loss": 3.337319850921631, "lr": 6.111121237368802e-05, "time_ms": 2689.401865005493, "eta_seconds": 699.2444849014282, "eta": "0:11:39", "timestamp": 1765146898.6025329} +{"step": 9750, "loss": 3.221512794494629, "lr": 6.1027431515228704e-05, "time_ms": 2689.9352073669434, "eta_seconds": 672.4838018417358, "eta": "0:11:12", "timestamp": 1765146925.4973016} +{"step": 9760, "loss": 3.3094615936279297, "lr": 6.094692800263382e-05, "time_ms": 2689.04972076416, "eta_seconds": 645.3719329833984, "eta": "0:10:45", "timestamp": 1765146952.3899589} +{"step": 9770, "loss": 3.2300150394439697, "lr": 6.0869702816813275e-05, "time_ms": 2689.7895336151123, "eta_seconds": 618.6515927314758, "eta": "0:10:18", "timestamp": 1765146979.2841277} +{"step": 9780, "loss": 3.306036949157715, "lr": 6.079575689873153e-05, "time_ms": 2689.4164085388184, "eta_seconds": 591.67160987854, "eta": "0:09:51", "timestamp": 1765147006.1775029} +{"step": 9790, "loss": 3.3454127311706543, "lr": 6.072509114939632e-05, "time_ms": 2689.775228500366, "eta_seconds": 564.8527979850769, "eta": "0:09:24", "timestamp": 1765147033.071847} +{"step": 9800, "loss": 3.304492473602295, "lr": 6.0657706429847466e-05, "time_ms": 2689.2566680908203, "eta_seconds": 537.8513336181641, "eta": "0:08:57", "timestamp": 1765147059.968857} +{"step": 9810, "loss": 3.455810070037842, "lr": 6.059360356114651e-05, "time_ms": 2688.8973712921143, "eta_seconds": 510.8905005455017, "eta": "0:08:30", "timestamp": 1765147086.862959} +{"step": 9820, "loss": 3.4776737689971924, "lr": 6.053278332436668e-05, "time_ms": 2689.0103816986084, "eta_seconds": 484.0218687057495, "eta": "0:08:04", "timestamp": 1765147113.7565496} +{"step": 9830, "loss": 3.3366410732269287, "lr": 6.0475246460583366e-05, "time_ms": 2689.279794692993, "eta_seconds": 457.17756509780884, "eta": "0:07:37", "timestamp": 1765147140.6531205} +{"step": 9840, "loss": 3.3179469108581543, "lr": 6.042099367086513e-05, "time_ms": 2689.0907287597656, "eta_seconds": 430.2545166015625, "eta": "0:07:10", "timestamp": 1765147167.5458026} +{"step": 9850, "loss": 3.3535568714141846, "lr": 6.037002561626506e-05, "time_ms": 2688.7810230255127, "eta_seconds": 403.3171534538269, "eta": "0:06:43", "timestamp": 1765147194.4385083} +{"step": 9860, "loss": 3.3613433837890625, "lr": 6.032234291781283e-05, "time_ms": 2688.74454498291, "eta_seconds": 376.4242362976074, "eta": "0:06:16", "timestamp": 1765147221.3307095} +{"step": 9870, "loss": 3.483717918395996, "lr": 6.027794615650705e-05, "time_ms": 2689.3749237060547, "eta_seconds": 349.6187400817871, "eta": "0:05:49", "timestamp": 1765147248.2211068} +{"step": 9880, "loss": 3.388702154159546, "lr": 6.0236835873308236e-05, "time_ms": 2689.330816268921, "eta_seconds": 322.7196979522705, "eta": "0:05:22", "timestamp": 1765147275.1128876} +{"step": 9890, "loss": 3.3678600788116455, "lr": 6.019901256913229e-05, "time_ms": 2688.1558895111084, "eta_seconds": 295.6971478462219, "eta": "0:04:55", "timestamp": 1765147302.003117} +{"step": 9900, "loss": 3.2922918796539307, "lr": 6.0164476704844146e-05, "time_ms": 2688.1864070892334, "eta_seconds": 268.81864070892334, "eta": "0:04:28", "timestamp": 1765147328.8951654} +{"step": 9910, "loss": 3.3373093605041504, "lr": 6.013322870125247e-05, "time_ms": 2689.406394958496, "eta_seconds": 242.04657554626465, "eta": "0:04:02", "timestamp": 1765147355.7884636} +{"step": 9920, "loss": 3.38280987739563, "lr": 6.0105268939104325e-05, "time_ms": 2688.615322113037, "eta_seconds": 215.08922576904297, "eta": "0:03:35", "timestamp": 1765147382.6790795} +{"step": 9930, "loss": 3.2267403602600098, "lr": 6.008059775908056e-05, "time_ms": 2688.2388591766357, "eta_seconds": 188.1767201423645, "eta": "0:03:08", "timestamp": 1765147409.5703785} +{"step": 9940, "loss": 3.354172945022583, "lr": 6.0059215461791714e-05, "time_ms": 2689.608335494995, "eta_seconds": 161.3765001296997, "eta": "0:02:41", "timestamp": 1765147436.464254} +{"step": 9950, "loss": 3.312748670578003, "lr": 6.004112230777436e-05, "time_ms": 2687.5503063201904, "eta_seconds": 134.37751531600952, "eta": "0:02:14", "timestamp": 1765147463.3538563} +{"step": 9960, "loss": 3.3858091831207275, "lr": 6.0026318517487855e-05, "time_ms": 2689.098119735718, "eta_seconds": 107.56392478942871, "eta": "0:01:47", "timestamp": 1765147490.2437391} +{"step": 9970, "loss": 3.364229440689087, "lr": 6.0014804271311725e-05, "time_ms": 2688.302755355835, "eta_seconds": 80.64908266067505, "eta": "0:01:20", "timestamp": 1765147517.1327198} +{"step": 9980, "loss": 3.2903707027435303, "lr": 6.000657970954342e-05, "time_ms": 2687.347412109375, "eta_seconds": 53.7469482421875, "eta": "0:00:53", "timestamp": 1765147544.021121} +{"step": 9990, "loss": 3.2541794776916504, "lr": 6.0001644932396594e-05, "time_ms": 2687.5641345977783, "eta_seconds": 26.875641345977783, "eta": "0:00:26", "timestamp": 1765147570.9073985}