bespoke_stratos_32B / trainer_log.jsonl
neginr's picture
Training in progress, epoch 0
50abb8c verified
{"current_steps": 1, "total_steps": 650, "loss": 0.786, "lr": 6.153846153846155e-07, "epoch": 0.007655502392344498, "percentage": 0.15, "elapsed_time": "0:01:50", "remaining_time": "19:55:39"}
{"current_steps": 2, "total_steps": 650, "loss": 0.8334, "lr": 1.230769230769231e-06, "epoch": 0.015311004784688996, "percentage": 0.31, "elapsed_time": "0:03:39", "remaining_time": "19:46:57"}
{"current_steps": 3, "total_steps": 650, "loss": 0.8015, "lr": 1.8461538461538465e-06, "epoch": 0.022966507177033493, "percentage": 0.46, "elapsed_time": "0:05:09", "remaining_time": "18:33:39"}
{"current_steps": 4, "total_steps": 650, "loss": 0.8098, "lr": 2.461538461538462e-06, "epoch": 0.03062200956937799, "percentage": 0.62, "elapsed_time": "0:06:48", "remaining_time": "18:20:14"}
{"current_steps": 5, "total_steps": 650, "loss": 0.784, "lr": 3.0769230769230774e-06, "epoch": 0.03827751196172249, "percentage": 0.77, "elapsed_time": "0:08:13", "remaining_time": "17:40:02"}
{"current_steps": 6, "total_steps": 650, "loss": 0.7565, "lr": 3.692307692307693e-06, "epoch": 0.045933014354066985, "percentage": 0.92, "elapsed_time": "0:10:06", "remaining_time": "18:04:13"}
{"current_steps": 7, "total_steps": 650, "loss": 0.7147, "lr": 4.307692307692308e-06, "epoch": 0.053588516746411484, "percentage": 1.08, "elapsed_time": "0:11:43", "remaining_time": "17:56:57"}
{"current_steps": 8, "total_steps": 650, "loss": 0.7361, "lr": 4.923076923076924e-06, "epoch": 0.06124401913875598, "percentage": 1.23, "elapsed_time": "0:13:41", "remaining_time": "18:18:06"}
{"current_steps": 9, "total_steps": 650, "loss": 0.6639, "lr": 5.538461538461539e-06, "epoch": 0.06889952153110047, "percentage": 1.38, "elapsed_time": "0:15:28", "remaining_time": "18:22:07"}
{"current_steps": 10, "total_steps": 650, "loss": 0.6813, "lr": 6.153846153846155e-06, "epoch": 0.07655502392344497, "percentage": 1.54, "elapsed_time": "0:17:16", "remaining_time": "18:25:20"}
{"current_steps": 11, "total_steps": 650, "loss": 0.6701, "lr": 6.76923076923077e-06, "epoch": 0.08421052631578947, "percentage": 1.69, "elapsed_time": "0:18:47", "remaining_time": "18:11:10"}
{"current_steps": 12, "total_steps": 650, "loss": 0.6234, "lr": 7.384615384615386e-06, "epoch": 0.09186602870813397, "percentage": 1.85, "elapsed_time": "0:20:37", "remaining_time": "18:16:52"}
{"current_steps": 13, "total_steps": 650, "loss": 0.6053, "lr": 8.000000000000001e-06, "epoch": 0.09952153110047847, "percentage": 2.0, "elapsed_time": "0:22:23", "remaining_time": "18:16:56"}
{"current_steps": 14, "total_steps": 650, "loss": 0.5654, "lr": 8.615384615384617e-06, "epoch": 0.10717703349282297, "percentage": 2.15, "elapsed_time": "0:24:14", "remaining_time": "18:20:56"}
{"current_steps": 15, "total_steps": 650, "loss": 0.5755, "lr": 9.230769230769232e-06, "epoch": 0.11483253588516747, "percentage": 2.31, "elapsed_time": "0:25:58", "remaining_time": "18:19:37"}
{"current_steps": 16, "total_steps": 650, "loss": 0.5421, "lr": 9.846153846153848e-06, "epoch": 0.12248803827751197, "percentage": 2.46, "elapsed_time": "0:27:45", "remaining_time": "18:19:47"}
{"current_steps": 17, "total_steps": 650, "loss": 0.5455, "lr": 1.0461538461538463e-05, "epoch": 0.13014354066985645, "percentage": 2.62, "elapsed_time": "0:29:22", "remaining_time": "18:13:34"}
{"current_steps": 18, "total_steps": 650, "loss": 0.5357, "lr": 1.1076923076923079e-05, "epoch": 0.13779904306220095, "percentage": 2.77, "elapsed_time": "0:31:15", "remaining_time": "18:17:23"}
{"current_steps": 19, "total_steps": 650, "loss": 0.5377, "lr": 1.1692307692307694e-05, "epoch": 0.14545454545454545, "percentage": 2.92, "elapsed_time": "0:33:06", "remaining_time": "18:19:30"}
{"current_steps": 20, "total_steps": 650, "loss": 0.5208, "lr": 1.230769230769231e-05, "epoch": 0.15311004784688995, "percentage": 3.08, "elapsed_time": "0:34:52", "remaining_time": "18:18:37"}
{"current_steps": 21, "total_steps": 650, "loss": 0.5243, "lr": 1.2923076923076925e-05, "epoch": 0.16076555023923444, "percentage": 3.23, "elapsed_time": "0:36:44", "remaining_time": "18:20:36"}
{"current_steps": 22, "total_steps": 650, "loss": 0.5012, "lr": 1.353846153846154e-05, "epoch": 0.16842105263157894, "percentage": 3.38, "elapsed_time": "0:38:25", "remaining_time": "18:16:46"}
{"current_steps": 23, "total_steps": 650, "loss": 0.4949, "lr": 1.4153846153846156e-05, "epoch": 0.17607655502392344, "percentage": 3.54, "elapsed_time": "0:40:39", "remaining_time": "18:28:17"}
{"current_steps": 24, "total_steps": 650, "loss": 0.4827, "lr": 1.4769230769230772e-05, "epoch": 0.18373205741626794, "percentage": 3.69, "elapsed_time": "0:42:08", "remaining_time": "18:19:00"}
{"current_steps": 25, "total_steps": 650, "loss": 0.5033, "lr": 1.5384615384615387e-05, "epoch": 0.19138755980861244, "percentage": 3.85, "elapsed_time": "0:43:49", "remaining_time": "18:15:41"}
{"current_steps": 26, "total_steps": 650, "loss": 0.5004, "lr": 1.6000000000000003e-05, "epoch": 0.19904306220095694, "percentage": 4.0, "elapsed_time": "0:45:29", "remaining_time": "18:11:48"}
{"current_steps": 27, "total_steps": 650, "loss": 0.4806, "lr": 1.6615384615384618e-05, "epoch": 0.20669856459330144, "percentage": 4.15, "elapsed_time": "0:47:30", "remaining_time": "18:16:08"}
{"current_steps": 28, "total_steps": 650, "loss": 0.4838, "lr": 1.7230769230769234e-05, "epoch": 0.21435406698564594, "percentage": 4.31, "elapsed_time": "0:49:37", "remaining_time": "18:22:28"}
{"current_steps": 29, "total_steps": 650, "loss": 0.4766, "lr": 1.784615384615385e-05, "epoch": 0.22200956937799043, "percentage": 4.46, "elapsed_time": "0:51:42", "remaining_time": "18:27:19"}
{"current_steps": 30, "total_steps": 650, "loss": 0.4568, "lr": 1.8461538461538465e-05, "epoch": 0.22966507177033493, "percentage": 4.62, "elapsed_time": "0:53:30", "remaining_time": "18:25:49"}
{"current_steps": 31, "total_steps": 650, "loss": 0.4837, "lr": 1.907692307692308e-05, "epoch": 0.23732057416267943, "percentage": 4.77, "elapsed_time": "0:55:20", "remaining_time": "18:25:11"}
{"current_steps": 32, "total_steps": 650, "loss": 0.4605, "lr": 1.9692307692307696e-05, "epoch": 0.24497607655502393, "percentage": 4.92, "elapsed_time": "0:57:35", "remaining_time": "18:32:20"}
{"current_steps": 33, "total_steps": 650, "loss": 0.4855, "lr": 2.0307692307692308e-05, "epoch": 0.25263157894736843, "percentage": 5.08, "elapsed_time": "0:59:39", "remaining_time": "18:35:34"}
{"current_steps": 34, "total_steps": 650, "loss": 0.4565, "lr": 2.0923076923076927e-05, "epoch": 0.2602870813397129, "percentage": 5.23, "elapsed_time": "1:01:31", "remaining_time": "18:34:47"}
{"current_steps": 35, "total_steps": 650, "loss": 0.459, "lr": 2.153846153846154e-05, "epoch": 0.2679425837320574, "percentage": 5.38, "elapsed_time": "1:03:39", "remaining_time": "18:38:25"}
{"current_steps": 36, "total_steps": 650, "loss": 0.4548, "lr": 2.2153846153846158e-05, "epoch": 0.2755980861244019, "percentage": 5.54, "elapsed_time": "1:05:31", "remaining_time": "18:37:32"}
{"current_steps": 37, "total_steps": 650, "loss": 0.4683, "lr": 2.276923076923077e-05, "epoch": 0.2832535885167464, "percentage": 5.69, "elapsed_time": "1:07:42", "remaining_time": "18:41:48"}
{"current_steps": 38, "total_steps": 650, "loss": 0.4346, "lr": 2.338461538461539e-05, "epoch": 0.2909090909090909, "percentage": 5.85, "elapsed_time": "1:09:32", "remaining_time": "18:39:57"}
{"current_steps": 39, "total_steps": 650, "loss": 0.4391, "lr": 2.4e-05, "epoch": 0.2985645933014354, "percentage": 6.0, "elapsed_time": "1:11:27", "remaining_time": "18:39:30"}
{"current_steps": 40, "total_steps": 650, "loss": 0.4383, "lr": 2.461538461538462e-05, "epoch": 0.3062200956937799, "percentage": 6.15, "elapsed_time": "1:13:07", "remaining_time": "18:35:15"}
{"current_steps": 41, "total_steps": 650, "loss": 0.4456, "lr": 2.523076923076923e-05, "epoch": 0.3138755980861244, "percentage": 6.31, "elapsed_time": "1:15:02", "remaining_time": "18:34:33"}
{"current_steps": 42, "total_steps": 650, "loss": 0.4231, "lr": 2.584615384615385e-05, "epoch": 0.3215311004784689, "percentage": 6.46, "elapsed_time": "1:16:53", "remaining_time": "18:33:05"}
{"current_steps": 43, "total_steps": 650, "loss": 0.4415, "lr": 2.6461538461538463e-05, "epoch": 0.3291866028708134, "percentage": 6.62, "elapsed_time": "1:18:43", "remaining_time": "18:31:24"}
{"current_steps": 44, "total_steps": 650, "loss": 0.4319, "lr": 2.707692307692308e-05, "epoch": 0.3368421052631579, "percentage": 6.77, "elapsed_time": "1:20:44", "remaining_time": "18:31:57"}
{"current_steps": 45, "total_steps": 650, "loss": 0.4229, "lr": 2.7692307692307694e-05, "epoch": 0.3444976076555024, "percentage": 6.92, "elapsed_time": "1:22:26", "remaining_time": "18:28:27"}
{"current_steps": 46, "total_steps": 650, "loss": 0.454, "lr": 2.8307692307692312e-05, "epoch": 0.3521531100478469, "percentage": 7.08, "elapsed_time": "1:24:43", "remaining_time": "18:32:24"}
{"current_steps": 47, "total_steps": 650, "loss": 0.4439, "lr": 2.8923076923076925e-05, "epoch": 0.3598086124401914, "percentage": 7.23, "elapsed_time": "1:26:36", "remaining_time": "18:31:03"}
{"current_steps": 48, "total_steps": 650, "loss": 0.4338, "lr": 2.9538461538461543e-05, "epoch": 0.3674641148325359, "percentage": 7.38, "elapsed_time": "1:28:23", "remaining_time": "18:28:39"}
{"current_steps": 49, "total_steps": 650, "loss": 0.433, "lr": 3.0153846153846155e-05, "epoch": 0.3751196172248804, "percentage": 7.54, "elapsed_time": "1:30:09", "remaining_time": "18:25:52"}
{"current_steps": 50, "total_steps": 650, "loss": 0.4277, "lr": 3.0769230769230774e-05, "epoch": 0.3827751196172249, "percentage": 7.69, "elapsed_time": "1:31:34", "remaining_time": "18:18:49"}
{"current_steps": 51, "total_steps": 650, "loss": 0.4258, "lr": 3.1384615384615386e-05, "epoch": 0.39043062200956935, "percentage": 7.85, "elapsed_time": "1:33:19", "remaining_time": "18:16:07"}
{"current_steps": 52, "total_steps": 650, "loss": 0.4118, "lr": 3.2000000000000005e-05, "epoch": 0.3980861244019139, "percentage": 8.0, "elapsed_time": "1:35:28", "remaining_time": "18:18:00"}
{"current_steps": 53, "total_steps": 650, "loss": 0.4209, "lr": 3.261538461538462e-05, "epoch": 0.40574162679425835, "percentage": 8.15, "elapsed_time": "1:37:05", "remaining_time": "18:13:40"}
{"current_steps": 54, "total_steps": 650, "loss": 0.4033, "lr": 3.3230769230769236e-05, "epoch": 0.4133971291866029, "percentage": 8.31, "elapsed_time": "1:38:43", "remaining_time": "18:09:33"}
{"current_steps": 55, "total_steps": 650, "loss": 0.4298, "lr": 3.384615384615385e-05, "epoch": 0.42105263157894735, "percentage": 8.46, "elapsed_time": "1:40:36", "remaining_time": "18:08:18"}
{"current_steps": 56, "total_steps": 650, "loss": 0.4411, "lr": 3.446153846153847e-05, "epoch": 0.42870813397129187, "percentage": 8.62, "elapsed_time": "1:42:26", "remaining_time": "18:06:33"}
{"current_steps": 57, "total_steps": 650, "loss": 0.4218, "lr": 3.507692307692308e-05, "epoch": 0.43636363636363634, "percentage": 8.77, "elapsed_time": "1:44:31", "remaining_time": "18:07:21"}
{"current_steps": 58, "total_steps": 650, "loss": 0.4322, "lr": 3.56923076923077e-05, "epoch": 0.44401913875598087, "percentage": 8.92, "elapsed_time": "1:46:22", "remaining_time": "18:05:44"}
{"current_steps": 59, "total_steps": 650, "loss": 0.4277, "lr": 3.630769230769231e-05, "epoch": 0.45167464114832534, "percentage": 9.08, "elapsed_time": "1:48:30", "remaining_time": "18:06:57"}
{"current_steps": 60, "total_steps": 650, "loss": 0.4285, "lr": 3.692307692307693e-05, "epoch": 0.45933014354066987, "percentage": 9.23, "elapsed_time": "1:50:45", "remaining_time": "18:09:11"}
{"current_steps": 61, "total_steps": 650, "loss": 0.4111, "lr": 3.753846153846154e-05, "epoch": 0.46698564593301434, "percentage": 9.38, "elapsed_time": "1:52:28", "remaining_time": "18:06:03"}
{"current_steps": 62, "total_steps": 650, "loss": 0.426, "lr": 3.815384615384616e-05, "epoch": 0.47464114832535886, "percentage": 9.54, "elapsed_time": "1:54:36", "remaining_time": "18:06:52"}
{"current_steps": 63, "total_steps": 650, "loss": 0.4261, "lr": 3.876923076923077e-05, "epoch": 0.48229665071770333, "percentage": 9.69, "elapsed_time": "1:56:08", "remaining_time": "18:02:04"}
{"current_steps": 64, "total_steps": 650, "loss": 0.4169, "lr": 3.938461538461539e-05, "epoch": 0.48995215311004786, "percentage": 9.85, "elapsed_time": "1:57:53", "remaining_time": "17:59:27"}
{"current_steps": 65, "total_steps": 650, "loss": 0.4214, "lr": 4e-05, "epoch": 0.49760765550239233, "percentage": 10.0, "elapsed_time": "1:59:40", "remaining_time": "17:57:01"}
{"current_steps": 66, "total_steps": 650, "loss": 0.4192, "lr": 3.999971160550277e-05, "epoch": 0.5052631578947369, "percentage": 10.15, "elapsed_time": "2:01:48", "remaining_time": "17:57:51"}
{"current_steps": 67, "total_steps": 650, "loss": 0.42, "lr": 3.999884643032821e-05, "epoch": 0.5129186602870813, "percentage": 10.31, "elapsed_time": "2:03:45", "remaining_time": "17:56:54"}
{"current_steps": 68, "total_steps": 650, "loss": 0.4175, "lr": 3.9997404499427494e-05, "epoch": 0.5205741626794258, "percentage": 10.46, "elapsed_time": "2:05:36", "remaining_time": "17:55:01"}
{"current_steps": 69, "total_steps": 650, "loss": 0.4114, "lr": 3.9995385854385124e-05, "epoch": 0.5282296650717704, "percentage": 10.62, "elapsed_time": "2:07:44", "remaining_time": "17:55:35"}
{"current_steps": 70, "total_steps": 650, "loss": 0.4058, "lr": 3.999279055341771e-05, "epoch": 0.5358851674641149, "percentage": 10.77, "elapsed_time": "2:09:33", "remaining_time": "17:53:29"}
{"current_steps": 71, "total_steps": 650, "loss": 0.4211, "lr": 3.9989618671372304e-05, "epoch": 0.5435406698564593, "percentage": 10.92, "elapsed_time": "2:11:16", "remaining_time": "17:50:30"}
{"current_steps": 72, "total_steps": 650, "loss": 0.4337, "lr": 3.998587029972423e-05, "epoch": 0.5511961722488038, "percentage": 11.08, "elapsed_time": "2:13:07", "remaining_time": "17:48:38"}
{"current_steps": 73, "total_steps": 650, "loss": 0.4239, "lr": 3.998154554657448e-05, "epoch": 0.5588516746411484, "percentage": 11.23, "elapsed_time": "2:15:00", "remaining_time": "17:47:06"}
{"current_steps": 74, "total_steps": 650, "loss": 0.418, "lr": 3.997664453664654e-05, "epoch": 0.5665071770334928, "percentage": 11.38, "elapsed_time": "2:16:40", "remaining_time": "17:43:50"}
{"current_steps": 75, "total_steps": 650, "loss": 0.4138, "lr": 3.9971167411282835e-05, "epoch": 0.5741626794258373, "percentage": 11.54, "elapsed_time": "2:18:13", "remaining_time": "17:39:46"}
{"current_steps": 76, "total_steps": 650, "loss": 0.4206, "lr": 3.996511432844067e-05, "epoch": 0.5818181818181818, "percentage": 11.69, "elapsed_time": "2:20:06", "remaining_time": "17:38:09"}
{"current_steps": 77, "total_steps": 650, "loss": 0.4095, "lr": 3.9958485462687606e-05, "epoch": 0.5894736842105263, "percentage": 11.85, "elapsed_time": "2:21:52", "remaining_time": "17:35:48"}
{"current_steps": 78, "total_steps": 650, "loss": 0.4155, "lr": 3.9951281005196486e-05, "epoch": 0.5971291866028708, "percentage": 12.0, "elapsed_time": "2:23:51", "remaining_time": "17:34:57"}
{"current_steps": 79, "total_steps": 650, "loss": 0.4244, "lr": 3.994350116373991e-05, "epoch": 0.6047846889952153, "percentage": 12.15, "elapsed_time": "2:25:14", "remaining_time": "17:29:47"}
{"current_steps": 80, "total_steps": 650, "loss": 0.4314, "lr": 3.9935146162684206e-05, "epoch": 0.6124401913875598, "percentage": 12.31, "elapsed_time": "2:26:57", "remaining_time": "17:27:07"}
{"current_steps": 81, "total_steps": 650, "loss": 0.4143, "lr": 3.9926216242983017e-05, "epoch": 0.6200956937799043, "percentage": 12.46, "elapsed_time": "2:28:42", "remaining_time": "17:24:35"}
{"current_steps": 82, "total_steps": 650, "loss": 0.4076, "lr": 3.991671166217031e-05, "epoch": 0.6277511961722488, "percentage": 12.62, "elapsed_time": "2:30:28", "remaining_time": "17:22:20"}
{"current_steps": 83, "total_steps": 650, "loss": 0.4148, "lr": 3.990663269435298e-05, "epoch": 0.6354066985645933, "percentage": 12.77, "elapsed_time": "2:32:19", "remaining_time": "17:20:37"}
{"current_steps": 84, "total_steps": 650, "loss": 0.4255, "lr": 3.989597963020289e-05, "epoch": 0.6430622009569378, "percentage": 12.92, "elapsed_time": "2:33:57", "remaining_time": "17:17:23"}
{"current_steps": 85, "total_steps": 650, "loss": 0.404, "lr": 3.9884752776948564e-05, "epoch": 0.6507177033492823, "percentage": 13.08, "elapsed_time": "2:35:33", "remaining_time": "17:14:02"}
{"current_steps": 86, "total_steps": 650, "loss": 0.4237, "lr": 3.9872952458366267e-05, "epoch": 0.6583732057416268, "percentage": 13.23, "elapsed_time": "2:37:26", "remaining_time": "17:12:33"}
{"current_steps": 87, "total_steps": 650, "loss": 0.4156, "lr": 3.986057901477069e-05, "epoch": 0.6660287081339713, "percentage": 13.38, "elapsed_time": "2:39:09", "remaining_time": "17:09:56"}
{"current_steps": 88, "total_steps": 650, "loss": 0.4211, "lr": 3.984763280300514e-05, "epoch": 0.6736842105263158, "percentage": 13.54, "elapsed_time": "2:41:08", "remaining_time": "17:09:05"}
{"current_steps": 89, "total_steps": 650, "loss": 0.442, "lr": 3.983411419643125e-05, "epoch": 0.6813397129186602, "percentage": 13.69, "elapsed_time": "2:43:11", "remaining_time": "17:08:36"}
{"current_steps": 90, "total_steps": 650, "loss": 0.416, "lr": 3.982002358491817e-05, "epoch": 0.6889952153110048, "percentage": 13.85, "elapsed_time": "2:45:03", "remaining_time": "17:07:01"}
{"current_steps": 91, "total_steps": 650, "loss": 0.4226, "lr": 3.980536137483141e-05, "epoch": 0.6966507177033493, "percentage": 14.0, "elapsed_time": "2:47:08", "remaining_time": "17:06:44"}
{"current_steps": 92, "total_steps": 650, "loss": 0.4135, "lr": 3.9790127989021024e-05, "epoch": 0.7043062200956938, "percentage": 14.15, "elapsed_time": "2:48:45", "remaining_time": "17:03:34"}
{"current_steps": 93, "total_steps": 650, "loss": 0.421, "lr": 3.9774323866809485e-05, "epoch": 0.7119617224880382, "percentage": 14.31, "elapsed_time": "2:50:37", "remaining_time": "17:01:54"}
{"current_steps": 94, "total_steps": 650, "loss": 0.4248, "lr": 3.9757949463978975e-05, "epoch": 0.7196172248803828, "percentage": 14.46, "elapsed_time": "2:52:33", "remaining_time": "17:00:38"}
{"current_steps": 95, "total_steps": 650, "loss": 0.4112, "lr": 3.9741005252758255e-05, "epoch": 0.7272727272727273, "percentage": 14.62, "elapsed_time": "2:54:27", "remaining_time": "16:59:11"}
{"current_steps": 96, "total_steps": 650, "loss": 0.4098, "lr": 3.9723491721809076e-05, "epoch": 0.7349282296650718, "percentage": 14.77, "elapsed_time": "2:56:35", "remaining_time": "16:59:06"}
{"current_steps": 97, "total_steps": 650, "loss": 0.4319, "lr": 3.970540937621201e-05, "epoch": 0.7425837320574162, "percentage": 14.92, "elapsed_time": "2:58:13", "remaining_time": "16:56:03"}
{"current_steps": 98, "total_steps": 650, "loss": 0.4218, "lr": 3.9686758737451955e-05, "epoch": 0.7502392344497608, "percentage": 15.08, "elapsed_time": "3:00:03", "remaining_time": "16:54:10"}
{"current_steps": 99, "total_steps": 650, "loss": 0.4146, "lr": 3.966754034340308e-05, "epoch": 0.7578947368421053, "percentage": 15.23, "elapsed_time": "3:01:56", "remaining_time": "16:52:39"}
{"current_steps": 100, "total_steps": 650, "loss": 0.3925, "lr": 3.9647754748313294e-05, "epoch": 0.7655502392344498, "percentage": 15.38, "elapsed_time": "3:03:43", "remaining_time": "16:50:26"}
{"current_steps": 101, "total_steps": 650, "loss": 0.4121, "lr": 3.962740252278827e-05, "epoch": 0.7732057416267942, "percentage": 15.54, "elapsed_time": "3:05:18", "remaining_time": "16:47:18"}
{"current_steps": 102, "total_steps": 650, "loss": 0.3992, "lr": 3.960648425377499e-05, "epoch": 0.7808612440191387, "percentage": 15.69, "elapsed_time": "3:07:22", "remaining_time": "16:46:42"}
{"current_steps": 103, "total_steps": 650, "loss": 0.3946, "lr": 3.958500054454482e-05, "epoch": 0.7885167464114833, "percentage": 15.85, "elapsed_time": "3:09:10", "remaining_time": "16:44:36"}
{"current_steps": 104, "total_steps": 650, "loss": 0.4165, "lr": 3.9562952014676116e-05, "epoch": 0.7961722488038278, "percentage": 16.0, "elapsed_time": "3:10:51", "remaining_time": "16:42:00"}
{"current_steps": 105, "total_steps": 650, "loss": 0.4402, "lr": 3.954033930003634e-05, "epoch": 0.8038277511961722, "percentage": 16.15, "elapsed_time": "3:12:51", "remaining_time": "16:41:01"}
{"current_steps": 106, "total_steps": 650, "loss": 0.4209, "lr": 3.9517163052763756e-05, "epoch": 0.8114832535885167, "percentage": 16.31, "elapsed_time": "3:14:45", "remaining_time": "16:39:31"}
{"current_steps": 107, "total_steps": 650, "loss": 0.4117, "lr": 3.9493423941248564e-05, "epoch": 0.8191387559808613, "percentage": 16.46, "elapsed_time": "3:16:34", "remaining_time": "16:37:36"}
{"current_steps": 108, "total_steps": 650, "loss": 0.4139, "lr": 3.946912265011368e-05, "epoch": 0.8267942583732057, "percentage": 16.62, "elapsed_time": "3:18:27", "remaining_time": "16:35:56"}
{"current_steps": 109, "total_steps": 650, "loss": 0.4098, "lr": 3.944425988019498e-05, "epoch": 0.8344497607655502, "percentage": 16.77, "elapsed_time": "3:20:32", "remaining_time": "16:35:21"}
{"current_steps": 110, "total_steps": 650, "loss": 0.4183, "lr": 3.9418836348521045e-05, "epoch": 0.8421052631578947, "percentage": 16.92, "elapsed_time": "3:22:39", "remaining_time": "16:34:50"}
{"current_steps": 111, "total_steps": 650, "loss": 0.3992, "lr": 3.9392852788292556e-05, "epoch": 0.8497607655502393, "percentage": 17.08, "elapsed_time": "3:24:35", "remaining_time": "16:33:27"}
{"current_steps": 112, "total_steps": 650, "loss": 0.4052, "lr": 3.936630994886109e-05, "epoch": 0.8574162679425837, "percentage": 17.23, "elapsed_time": "3:26:22", "remaining_time": "16:31:18"}
{"current_steps": 113, "total_steps": 650, "loss": 0.4009, "lr": 3.933920859570753e-05, "epoch": 0.8650717703349282, "percentage": 17.38, "elapsed_time": "3:28:07", "remaining_time": "16:29:03"}
{"current_steps": 114, "total_steps": 650, "loss": 0.4119, "lr": 3.931154951041998e-05, "epoch": 0.8727272727272727, "percentage": 17.54, "elapsed_time": "3:29:53", "remaining_time": "16:26:52"}
{"current_steps": 115, "total_steps": 650, "loss": 0.4295, "lr": 3.928333349067125e-05, "epoch": 0.8803827751196173, "percentage": 17.69, "elapsed_time": "3:31:47", "remaining_time": "16:25:15"}
{"current_steps": 116, "total_steps": 650, "loss": 0.3942, "lr": 3.925456135019582e-05, "epoch": 0.8880382775119617, "percentage": 17.85, "elapsed_time": "3:33:29", "remaining_time": "16:22:46"}
{"current_steps": 117, "total_steps": 650, "loss": 0.4184, "lr": 3.922523391876638e-05, "epoch": 0.8956937799043062, "percentage": 18.0, "elapsed_time": "3:35:13", "remaining_time": "16:20:29"}
{"current_steps": 118, "total_steps": 650, "loss": 0.4153, "lr": 3.9195352042169924e-05, "epoch": 0.9033492822966507, "percentage": 18.15, "elapsed_time": "3:36:58", "remaining_time": "16:18:12"}
{"current_steps": 119, "total_steps": 650, "loss": 0.4019, "lr": 3.916491658218333e-05, "epoch": 0.9110047846889953, "percentage": 18.31, "elapsed_time": "3:38:44", "remaining_time": "16:16:05"}
{"current_steps": 120, "total_steps": 650, "loss": 0.4068, "lr": 3.913392841654851e-05, "epoch": 0.9186602870813397, "percentage": 18.46, "elapsed_time": "3:40:29", "remaining_time": "16:13:50"}
{"current_steps": 121, "total_steps": 650, "loss": 0.4071, "lr": 3.9102388438947104e-05, "epoch": 0.9263157894736842, "percentage": 18.62, "elapsed_time": "3:42:05", "remaining_time": "16:10:56"}
{"current_steps": 122, "total_steps": 650, "loss": 0.4084, "lr": 3.907029755897473e-05, "epoch": 0.9339712918660287, "percentage": 18.77, "elapsed_time": "3:44:01", "remaining_time": "16:09:33"}
{"current_steps": 123, "total_steps": 650, "loss": 0.406, "lr": 3.903765670211469e-05, "epoch": 0.9416267942583733, "percentage": 18.92, "elapsed_time": "3:45:42", "remaining_time": "16:07:04"}
{"current_steps": 124, "total_steps": 650, "loss": 0.4129, "lr": 3.9004466809711343e-05, "epoch": 0.9492822966507177, "percentage": 19.08, "elapsed_time": "3:47:28", "remaining_time": "16:04:54"}
{"current_steps": 125, "total_steps": 650, "loss": 0.4082, "lr": 3.897072883894291e-05, "epoch": 0.9569377990430622, "percentage": 19.23, "elapsed_time": "3:49:07", "remaining_time": "16:02:19"}
{"current_steps": 126, "total_steps": 650, "loss": 0.3899, "lr": 3.893644376279392e-05, "epoch": 0.9645933014354067, "percentage": 19.38, "elapsed_time": "3:50:59", "remaining_time": "16:00:39"}
{"current_steps": 127, "total_steps": 650, "loss": 0.3981, "lr": 3.89016125700271e-05, "epoch": 0.9722488038277513, "percentage": 19.54, "elapsed_time": "3:52:45", "remaining_time": "15:58:30"}
{"current_steps": 128, "total_steps": 650, "loss": 0.4186, "lr": 3.8866236265154864e-05, "epoch": 0.9799043062200957, "percentage": 19.69, "elapsed_time": "3:54:44", "remaining_time": "15:57:19"}
{"current_steps": 129, "total_steps": 650, "loss": 0.404, "lr": 3.88303158684104e-05, "epoch": 0.9875598086124402, "percentage": 19.85, "elapsed_time": "3:56:33", "remaining_time": "15:55:23"}
{"current_steps": 130, "total_steps": 650, "loss": 0.4107, "lr": 3.879385241571817e-05, "epoch": 0.9952153110047847, "percentage": 20.0, "elapsed_time": "3:58:31", "remaining_time": "15:54:07"}
{"current_steps": 131, "total_steps": 650, "loss": 0.3982, "lr": 3.875684695866409e-05, "epoch": 1.0028708133971291, "percentage": 20.15, "elapsed_time": "4:12:19", "remaining_time": "16:39:40"}
{"current_steps": 132, "total_steps": 650, "loss": 0.346, "lr": 3.871930056446518e-05, "epoch": 1.0105263157894737, "percentage": 20.31, "elapsed_time": "4:14:03", "remaining_time": "16:36:58"}
{"current_steps": 133, "total_steps": 650, "loss": 0.3288, "lr": 3.8681214315938786e-05, "epoch": 1.018181818181818, "percentage": 20.46, "elapsed_time": "4:16:04", "remaining_time": "16:35:24"}
{"current_steps": 134, "total_steps": 650, "loss": 0.3318, "lr": 3.864258931147136e-05, "epoch": 1.0258373205741627, "percentage": 20.62, "elapsed_time": "4:17:53", "remaining_time": "16:33:06"}
{"current_steps": 135, "total_steps": 650, "loss": 0.3217, "lr": 3.860342666498677e-05, "epoch": 1.0334928229665072, "percentage": 20.77, "elapsed_time": "4:19:28", "remaining_time": "16:29:52"}
{"current_steps": 136, "total_steps": 650, "loss": 0.3149, "lr": 3.856372750591419e-05, "epoch": 1.0411483253588516, "percentage": 20.92, "elapsed_time": "4:21:24", "remaining_time": "16:27:59"}