| {"current_steps": 5, "total_steps": 600, "loss": 3.7984, "lr": 6.666666666666667e-06, "epoch": 0.12738853503184713, "percentage": 0.83, "elapsed_time": "0:00:07", "remaining_time": "0:14:40"} |
| {"current_steps": 10, "total_steps": 600, "loss": 3.8072, "lr": 1.5e-05, "epoch": 0.25477707006369427, "percentage": 1.67, "elapsed_time": "0:00:13", "remaining_time": "0:13:28"} |
| {"current_steps": 15, "total_steps": 600, "loss": 3.7454, "lr": 2.3333333333333336e-05, "epoch": 0.3821656050955414, "percentage": 2.5, "elapsed_time": "0:00:19", "remaining_time": "0:12:58"} |
| {"current_steps": 20, "total_steps": 600, "loss": 3.3677, "lr": 3.1666666666666666e-05, "epoch": 0.5095541401273885, "percentage": 3.33, "elapsed_time": "0:00:26", "remaining_time": "0:12:39"} |
| {"current_steps": 25, "total_steps": 600, "loss": 3.2859, "lr": 4e-05, "epoch": 0.6369426751592356, "percentage": 4.17, "elapsed_time": "0:00:32", "remaining_time": "0:12:24"} |
| {"current_steps": 25, "total_steps": 600, "eval_loss": 2.8292243480682373, "epoch": 0.6369426751592356, "percentage": 4.17, "elapsed_time": "0:00:33", "remaining_time": "0:12:51"} |
| {"current_steps": 30, "total_steps": 600, "loss": 2.8454, "lr": 4.8333333333333334e-05, "epoch": 0.7643312101910829, "percentage": 5.0, "elapsed_time": "0:00:39", "remaining_time": "0:12:34"} |
| {"current_steps": 35, "total_steps": 600, "loss": 2.5979, "lr": 4.999392477398737e-05, "epoch": 0.89171974522293, "percentage": 5.83, "elapsed_time": "0:00:45", "remaining_time": "0:12:19"} |
| {"current_steps": 40, "total_steps": 600, "loss": 2.5103, "lr": 4.996924922870762e-05, "epoch": 1.0, "percentage": 6.67, "elapsed_time": "0:00:51", "remaining_time": "0:11:54"} |
| {"current_steps": 45, "total_steps": 600, "loss": 2.1311, "lr": 4.992561238637912e-05, "epoch": 1.127388535031847, "percentage": 7.5, "elapsed_time": "0:00:57", "remaining_time": "0:11:46"} |
| {"current_steps": 50, "total_steps": 600, "loss": 2.0143, "lr": 4.9863047384206835e-05, "epoch": 1.2547770700636942, "percentage": 8.33, "elapsed_time": "0:01:03", "remaining_time": "0:11:37"} |
| {"current_steps": 50, "total_steps": 600, "eval_loss": 1.9939861297607422, "epoch": 1.2547770700636942, "percentage": 8.33, "elapsed_time": "0:01:04", "remaining_time": "0:11:50"} |
| {"current_steps": 55, "total_steps": 600, "loss": 2.0247, "lr": 4.978160173317438e-05, "epoch": 1.3821656050955413, "percentage": 9.17, "elapsed_time": "0:01:11", "remaining_time": "0:11:53"} |
| {"current_steps": 60, "total_steps": 600, "loss": 1.9287, "lr": 4.968133728196486e-05, "epoch": 1.5095541401273884, "percentage": 10.0, "elapsed_time": "0:01:18", "remaining_time": "0:11:43"} |
| {"current_steps": 65, "total_steps": 600, "loss": 1.7431, "lr": 4.956233016999379e-05, "epoch": 1.6369426751592355, "percentage": 10.83, "elapsed_time": "0:01:24", "remaining_time": "0:11:34"} |
| {"current_steps": 70, "total_steps": 600, "loss": 1.8979, "lr": 4.9424670769589984e-05, "epoch": 1.7643312101910829, "percentage": 11.67, "elapsed_time": "0:01:30", "remaining_time": "0:11:25"} |
| {"current_steps": 75, "total_steps": 600, "loss": 1.6829, "lr": 4.9268463617368e-05, "epoch": 1.89171974522293, "percentage": 12.5, "elapsed_time": "0:01:36", "remaining_time": "0:11:16"} |
| {"current_steps": 75, "total_steps": 600, "eval_loss": 1.7856135368347168, "epoch": 1.89171974522293, "percentage": 12.5, "elapsed_time": "0:01:37", "remaining_time": "0:11:24"} |
| {"current_steps": 80, "total_steps": 600, "loss": 1.6997, "lr": 4.9093827334844546e-05, "epoch": 2.0, "percentage": 13.33, "elapsed_time": "0:01:43", "remaining_time": "0:11:09"} |
| {"current_steps": 85, "total_steps": 600, "loss": 1.587, "lr": 4.8900894538358944e-05, "epoch": 2.127388535031847, "percentage": 14.17, "elapsed_time": "0:01:49", "remaining_time": "0:11:02"} |
| {"current_steps": 90, "total_steps": 600, "loss": 1.5455, "lr": 4.8689811738366155e-05, "epoch": 2.254777070063694, "percentage": 15.0, "elapsed_time": "0:01:55", "remaining_time": "0:10:55"} |
| {"current_steps": 95, "total_steps": 600, "loss": 1.5951, "lr": 4.8460739228178806e-05, "epoch": 2.3821656050955413, "percentage": 15.83, "elapsed_time": "0:02:01", "remaining_time": "0:10:48"} |
| {"current_steps": 100, "total_steps": 600, "loss": 1.4774, "lr": 4.821385096224268e-05, "epoch": 2.5095541401273884, "percentage": 16.67, "elapsed_time": "0:02:08", "remaining_time": "0:10:40"} |
| {"current_steps": 100, "total_steps": 600, "eval_loss": 1.7516053915023804, "epoch": 2.5095541401273884, "percentage": 16.67, "elapsed_time": "0:02:09", "remaining_time": "0:10:46"} |
| {"current_steps": 105, "total_steps": 600, "loss": 1.448, "lr": 4.7949334424038176e-05, "epoch": 2.6369426751592355, "percentage": 17.5, "elapsed_time": "0:02:16", "remaining_time": "0:10:44"} |
| {"current_steps": 110, "total_steps": 600, "loss": 1.4961, "lr": 4.7667390483707986e-05, "epoch": 2.7643312101910826, "percentage": 18.33, "elapsed_time": "0:02:22", "remaining_time": "0:10:35"} |
| {"current_steps": 115, "total_steps": 600, "loss": 1.4448, "lr": 4.736823324551909e-05, "epoch": 2.8917197452229297, "percentage": 19.17, "elapsed_time": "0:02:28", "remaining_time": "0:10:28"} |
| {"current_steps": 120, "total_steps": 600, "loss": 1.5377, "lr": 4.7052089885275055e-05, "epoch": 3.0, "percentage": 20.0, "elapsed_time": "0:02:34", "remaining_time": "0:10:16"} |
| {"current_steps": 125, "total_steps": 600, "loss": 1.1908, "lr": 4.671920047780186e-05, "epoch": 3.127388535031847, "percentage": 20.83, "elapsed_time": "0:02:40", "remaining_time": "0:10:09"} |
| {"current_steps": 125, "total_steps": 600, "eval_loss": 1.6817084550857544, "epoch": 3.127388535031847, "percentage": 20.83, "elapsed_time": "0:02:41", "remaining_time": "0:10:14"} |
| {"current_steps": 130, "total_steps": 600, "loss": 1.3108, "lr": 4.6369817814638475e-05, "epoch": 3.254777070063694, "percentage": 21.67, "elapsed_time": "0:02:47", "remaining_time": "0:10:07"} |
| {"current_steps": 135, "total_steps": 600, "loss": 1.1886, "lr": 4.600420721207053e-05, "epoch": 3.3821656050955413, "percentage": 22.5, "elapsed_time": "0:02:54", "remaining_time": "0:10:00"} |
| {"current_steps": 140, "total_steps": 600, "loss": 1.1127, "lr": 4.5622646309652794e-05, "epoch": 3.5095541401273884, "percentage": 23.33, "elapsed_time": "0:03:00", "remaining_time": "0:09:53"} |
| {"current_steps": 145, "total_steps": 600, "loss": 1.1102, "lr": 4.522542485937369e-05, "epoch": 3.6369426751592355, "percentage": 24.17, "elapsed_time": "0:03:06", "remaining_time": "0:09:45"} |
| {"current_steps": 150, "total_steps": 600, "loss": 1.2046, "lr": 4.481284450562163e-05, "epoch": 3.7643312101910826, "percentage": 25.0, "elapsed_time": "0:03:12", "remaining_time": "0:09:38"} |
| {"current_steps": 150, "total_steps": 600, "eval_loss": 1.6712156534194946, "epoch": 3.7643312101910826, "percentage": 25.0, "elapsed_time": "0:03:14", "remaining_time": "0:09:42"} |
| {"current_steps": 155, "total_steps": 600, "loss": 1.0573, "lr": 4.438521855612054e-05, "epoch": 3.8917197452229297, "percentage": 25.83, "elapsed_time": "0:03:21", "remaining_time": "0:09:37"} |
| {"current_steps": 160, "total_steps": 600, "loss": 1.3037, "lr": 4.3942871744008374e-05, "epoch": 4.0, "percentage": 26.67, "elapsed_time": "0:03:26", "remaining_time": "0:09:27"} |
| {"current_steps": 165, "total_steps": 600, "loss": 0.879, "lr": 4.3486139981239304e-05, "epoch": 4.127388535031847, "percentage": 27.5, "elapsed_time": "0:03:32", "remaining_time": "0:09:20"} |
| {"current_steps": 170, "total_steps": 600, "loss": 0.9412, "lr": 4.301537010349696e-05, "epoch": 4.254777070063694, "percentage": 28.33, "elapsed_time": "0:03:38", "remaining_time": "0:09:13"} |
| {"current_steps": 175, "total_steps": 600, "loss": 0.8012, "lr": 4.2530919606812216e-05, "epoch": 4.382165605095541, "percentage": 29.17, "elapsed_time": "0:03:44", "remaining_time": "0:09:06"} |
| {"current_steps": 175, "total_steps": 600, "eval_loss": 1.7618356943130493, "epoch": 4.382165605095541, "percentage": 29.17, "elapsed_time": "0:03:46", "remaining_time": "0:09:08"} |
| {"current_steps": 180, "total_steps": 600, "loss": 0.9443, "lr": 4.203315637608578e-05, "epoch": 4.509554140127388, "percentage": 30.0, "elapsed_time": "0:03:52", "remaining_time": "0:09:01"} |
| {"current_steps": 185, "total_steps": 600, "loss": 0.8479, "lr": 4.152245840572153e-05, "epoch": 4.6369426751592355, "percentage": 30.83, "elapsed_time": "0:03:58", "remaining_time": "0:08:54"} |
| {"current_steps": 190, "total_steps": 600, "loss": 0.8732, "lr": 4.099921351258292e-05, "epoch": 4.764331210191083, "percentage": 31.67, "elapsed_time": "0:04:04", "remaining_time": "0:08:47"} |
| {"current_steps": 195, "total_steps": 600, "loss": 0.8117, "lr": 4.046381904149024e-05, "epoch": 4.89171974522293, "percentage": 32.5, "elapsed_time": "0:04:10", "remaining_time": "0:08:41"} |
| {"current_steps": 200, "total_steps": 600, "loss": 0.9595, "lr": 3.991668156348261e-05, "epoch": 5.0, "percentage": 33.33, "elapsed_time": "0:04:16", "remaining_time": "0:08:32"} |
| {"current_steps": 200, "total_steps": 600, "eval_loss": 1.7216202020645142, "epoch": 5.0, "percentage": 33.33, "elapsed_time": "0:04:17", "remaining_time": "0:08:34"} |
| {"current_steps": 205, "total_steps": 600, "loss": 0.6461, "lr": 3.935821656707359e-05, "epoch": 5.127388535031847, "percentage": 34.17, "elapsed_time": "0:04:24", "remaining_time": "0:08:29"} |
| {"current_steps": 210, "total_steps": 600, "loss": 0.5982, "lr": 3.878884814273509e-05, "epoch": 5.254777070063694, "percentage": 35.0, "elapsed_time": "0:04:30", "remaining_time": "0:08:22"} |
| {"current_steps": 215, "total_steps": 600, "loss": 0.6205, "lr": 3.8209008660848974e-05, "epoch": 5.382165605095541, "percentage": 35.83, "elapsed_time": "0:04:36", "remaining_time": "0:08:15"} |
| {"current_steps": 220, "total_steps": 600, "loss": 0.5558, "lr": 3.76191384433711e-05, "epoch": 5.509554140127388, "percentage": 36.67, "elapsed_time": "0:04:43", "remaining_time": "0:08:08"} |
| {"current_steps": 225, "total_steps": 600, "loss": 0.5115, "lr": 3.7019685429456986e-05, "epoch": 5.6369426751592355, "percentage": 37.5, "elapsed_time": "0:04:49", "remaining_time": "0:08:02"} |
| {"current_steps": 225, "total_steps": 600, "eval_loss": 1.8211851119995117, "epoch": 5.6369426751592355, "percentage": 37.5, "elapsed_time": "0:04:50", "remaining_time": "0:08:04"} |
| {"current_steps": 230, "total_steps": 600, "loss": 0.6233, "lr": 3.6411104835303166e-05, "epoch": 5.764331210191083, "percentage": 38.33, "elapsed_time": "0:04:57", "remaining_time": "0:07:58"} |
| {"current_steps": 235, "total_steps": 600, "loss": 0.5701, "lr": 3.579385880846232e-05, "epoch": 5.89171974522293, "percentage": 39.17, "elapsed_time": "0:05:03", "remaining_time": "0:07:51"} |
| {"current_steps": 240, "total_steps": 600, "loss": 0.652, "lr": 3.516841607689501e-05, "epoch": 6.0, "percentage": 40.0, "elapsed_time": "0:05:08", "remaining_time": "0:07:43"} |
| {"current_steps": 245, "total_steps": 600, "loss": 0.3898, "lr": 3.453525159302415e-05, "epoch": 6.127388535031847, "percentage": 40.83, "elapsed_time": "0:05:14", "remaining_time": "0:07:36"} |
| {"current_steps": 250, "total_steps": 600, "loss": 0.4666, "lr": 3.389484617306292e-05, "epoch": 6.254777070063694, "percentage": 41.67, "elapsed_time": "0:05:21", "remaining_time": "0:07:29"} |
| {"current_steps": 250, "total_steps": 600, "eval_loss": 2.177734136581421, "epoch": 6.254777070063694, "percentage": 41.67, "elapsed_time": "0:05:22", "remaining_time": "0:07:30"} |
| {"current_steps": 255, "total_steps": 600, "loss": 0.3194, "lr": 3.3247686131889574e-05, "epoch": 6.382165605095541, "percentage": 42.5, "elapsed_time": "0:05:29", "remaining_time": "0:07:25"} |
| {"current_steps": 260, "total_steps": 600, "loss": 0.3603, "lr": 3.2594262913746865e-05, "epoch": 6.509554140127388, "percentage": 43.33, "elapsed_time": "0:05:35", "remaining_time": "0:07:18"} |
| {"current_steps": 265, "total_steps": 600, "loss": 0.4139, "lr": 3.1935072719046115e-05, "epoch": 6.6369426751592355, "percentage": 44.17, "elapsed_time": "0:05:41", "remaining_time": "0:07:11"} |
| {"current_steps": 270, "total_steps": 600, "loss": 0.398, "lr": 3.127061612755961e-05, "epoch": 6.764331210191083, "percentage": 45.0, "elapsed_time": "0:05:47", "remaining_time": "0:07:05"} |
| {"current_steps": 275, "total_steps": 600, "loss": 0.4082, "lr": 3.06013977182874e-05, "epoch": 6.89171974522293, "percentage": 45.83, "elapsed_time": "0:05:54", "remaining_time": "0:06:58"} |
| {"current_steps": 275, "total_steps": 600, "eval_loss": 2.0292844772338867, "epoch": 6.89171974522293, "percentage": 45.83, "elapsed_time": "0:05:55", "remaining_time": "0:06:59"} |
| {"current_steps": 280, "total_steps": 600, "loss": 0.3706, "lr": 2.9927925686287006e-05, "epoch": 7.0, "percentage": 46.67, "elapsed_time": "0:06:00", "remaining_time": "0:06:51"} |
| {"current_steps": 285, "total_steps": 600, "loss": 0.2333, "lr": 2.925071145675733e-05, "epoch": 7.127388535031847, "percentage": 47.5, "elapsed_time": "0:06:06", "remaining_time": "0:06:45"} |
| {"current_steps": 290, "total_steps": 600, "loss": 0.2746, "lr": 2.8570269296669466e-05, "epoch": 7.254777070063694, "percentage": 48.33, "elapsed_time": "0:06:12", "remaining_time": "0:06:38"} |
| {"current_steps": 295, "total_steps": 600, "loss": 0.2495, "lr": 2.788711592423966e-05, "epoch": 7.382165605095541, "percentage": 49.17, "elapsed_time": "0:06:19", "remaining_time": "0:06:31"} |
| {"current_steps": 300, "total_steps": 600, "loss": 0.2262, "lr": 2.720177011654067e-05, "epoch": 7.509554140127388, "percentage": 50.0, "elapsed_time": "0:06:25", "remaining_time": "0:06:25"} |
| {"current_steps": 300, "total_steps": 600, "eval_loss": 2.3396387100219727, "epoch": 7.509554140127388, "percentage": 50.0, "elapsed_time": "0:06:26", "remaining_time": "0:06:26"} |
| {"current_steps": 305, "total_steps": 600, "loss": 0.2665, "lr": 2.6514752315549847e-05, "epoch": 7.6369426751592355, "percentage": 50.83, "elapsed_time": "0:06:33", "remaining_time": "0:06:20"} |
| {"current_steps": 310, "total_steps": 600, "loss": 0.2769, "lr": 2.5826584232932706e-05, "epoch": 7.764331210191083, "percentage": 51.67, "elapsed_time": "0:06:39", "remaining_time": "0:06:14"} |
| {"current_steps": 315, "total_steps": 600, "loss": 0.2252, "lr": 2.5137788453862515e-05, "epoch": 7.89171974522293, "percentage": 52.5, "elapsed_time": "0:06:46", "remaining_time": "0:06:07"} |
| {"current_steps": 320, "total_steps": 600, "loss": 0.2672, "lr": 2.4448888040176365e-05, "epoch": 8.0, "percentage": 53.33, "elapsed_time": "0:06:51", "remaining_time": "0:05:59"} |
| {"current_steps": 325, "total_steps": 600, "loss": 0.1774, "lr": 2.3760406133169443e-05, "epoch": 8.127388535031848, "percentage": 54.17, "elapsed_time": "0:06:57", "remaining_time": "0:05:53"} |
| {"current_steps": 325, "total_steps": 600, "eval_loss": 2.345935821533203, "epoch": 8.127388535031848, "percentage": 54.17, "elapsed_time": "0:06:58", "remaining_time": "0:05:54"} |
| {"current_steps": 330, "total_steps": 600, "loss": 0.1316, "lr": 2.3072865556328822e-05, "epoch": 8.254777070063694, "percentage": 55.0, "elapsed_time": "0:07:05", "remaining_time": "0:05:47"} |
| {"current_steps": 335, "total_steps": 600, "loss": 0.1199, "lr": 2.238678841830867e-05, "epoch": 8.382165605095542, "percentage": 55.83, "elapsed_time": "0:07:11", "remaining_time": "0:05:41"} |
| {"current_steps": 340, "total_steps": 600, "loss": 0.1955, "lr": 2.1702695716448278e-05, "epoch": 8.509554140127388, "percentage": 56.67, "elapsed_time": "0:07:17", "remaining_time": "0:05:34"} |
| {"current_steps": 345, "total_steps": 600, "loss": 0.1369, "lr": 2.1021106941134012e-05, "epoch": 8.636942675159236, "percentage": 57.5, "elapsed_time": "0:07:23", "remaining_time": "0:05:28"} |
| {"current_steps": 350, "total_steps": 600, "loss": 0.1512, "lr": 2.0342539681305602e-05, "epoch": 8.764331210191083, "percentage": 58.33, "elapsed_time": "0:07:30", "remaining_time": "0:05:21"} |
| {"current_steps": 350, "total_steps": 600, "eval_loss": 2.4745495319366455, "epoch": 8.764331210191083, "percentage": 58.33, "elapsed_time": "0:07:31", "remaining_time": "0:05:22"} |
| {"current_steps": 355, "total_steps": 600, "loss": 0.1519, "lr": 1.9667509231406334e-05, "epoch": 8.89171974522293, "percentage": 59.17, "elapsed_time": "0:07:38", "remaining_time": "0:05:16"} |
| {"current_steps": 360, "total_steps": 600, "loss": 0.1857, "lr": 1.899652820007576e-05, "epoch": 9.0, "percentage": 60.0, "elapsed_time": "0:07:43", "remaining_time": "0:05:09"} |
| {"current_steps": 365, "total_steps": 600, "loss": 0.0731, "lr": 1.8330106120881846e-05, "epoch": 9.127388535031848, "percentage": 60.83, "elapsed_time": "0:07:49", "remaining_time": "0:05:02"} |
| {"current_steps": 370, "total_steps": 600, "loss": 0.0974, "lr": 1.7668749065388385e-05, "epoch": 9.254777070063694, "percentage": 61.67, "elapsed_time": "0:07:56", "remaining_time": "0:04:55"} |
| {"current_steps": 375, "total_steps": 600, "loss": 0.0719, "lr": 1.70129592588513e-05, "epoch": 9.382165605095542, "percentage": 62.5, "elapsed_time": "0:08:02", "remaining_time": "0:04:49"} |
| {"current_steps": 375, "total_steps": 600, "eval_loss": 2.771934747695923, "epoch": 9.382165605095542, "percentage": 62.5, "elapsed_time": "0:08:03", "remaining_time": "0:04:50"} |
| {"current_steps": 380, "total_steps": 600, "loss": 0.0901, "lr": 1.6363234698835896e-05, "epoch": 9.509554140127388, "percentage": 63.33, "elapsed_time": "0:08:09", "remaining_time": "0:04:43"} |
| {"current_steps": 385, "total_steps": 600, "loss": 0.1384, "lr": 1.5720068777044476e-05, "epoch": 9.636942675159236, "percentage": 64.17, "elapsed_time": "0:08:15", "remaining_time": "0:04:36"} |
| {"current_steps": 390, "total_steps": 600, "loss": 0.0785, "lr": 1.5083949904641654e-05, "epoch": 9.764331210191083, "percentage": 65.0, "elapsed_time": "0:08:22", "remaining_time": "0:04:30"} |
| {"current_steps": 395, "total_steps": 600, "loss": 0.0952, "lr": 1.44553611413617e-05, "epoch": 9.89171974522293, "percentage": 65.83, "elapsed_time": "0:08:28", "remaining_time": "0:04:23"} |
| {"current_steps": 400, "total_steps": 600, "loss": 0.0741, "lr": 1.383477982867984e-05, "epoch": 10.0, "percentage": 66.67, "elapsed_time": "0:08:33", "remaining_time": "0:04:16"} |
| {"current_steps": 400, "total_steps": 600, "eval_loss": 2.7705841064453125, "epoch": 10.0, "percentage": 66.67, "elapsed_time": "0:08:34", "remaining_time": "0:04:17"} |
| {"current_steps": 405, "total_steps": 600, "loss": 0.0545, "lr": 1.322267722732582e-05, "epoch": 10.127388535031848, "percentage": 67.5, "elapsed_time": "0:08:41", "remaining_time": "0:04:11"} |
| {"current_steps": 410, "total_steps": 600, "loss": 0.0576, "lr": 1.2619518159415139e-05, "epoch": 10.254777070063694, "percentage": 68.33, "elapsed_time": "0:08:47", "remaining_time": "0:04:04"} |
| {"current_steps": 415, "total_steps": 600, "loss": 0.0513, "lr": 1.202576065546963e-05, "epoch": 10.382165605095542, "percentage": 69.17, "elapsed_time": "0:08:53", "remaining_time": "0:03:57"} |
| {"current_steps": 420, "total_steps": 600, "loss": 0.061, "lr": 1.1441855606595545e-05, "epoch": 10.509554140127388, "percentage": 70.0, "elapsed_time": "0:09:00", "remaining_time": "0:03:51"} |
| {"current_steps": 425, "total_steps": 600, "loss": 0.0679, "lr": 1.0868246422083204e-05, "epoch": 10.636942675159236, "percentage": 70.83, "elapsed_time": "0:09:06", "remaining_time": "0:03:45"} |
| {"current_steps": 425, "total_steps": 600, "eval_loss": 2.8739261627197266, "epoch": 10.636942675159236, "percentage": 70.83, "elapsed_time": "0:09:07", "remaining_time": "0:03:45"} |
| {"current_steps": 430, "total_steps": 600, "loss": 0.0629, "lr": 1.0305368692688174e-05, "epoch": 10.764331210191083, "percentage": 71.67, "elapsed_time": "0:09:14", "remaining_time": "0:03:39"} |
| {"current_steps": 435, "total_steps": 600, "loss": 0.0557, "lr": 9.753649859849775e-06, "epoch": 10.89171974522293, "percentage": 72.5, "elapsed_time": "0:09:20", "remaining_time": "0:03:32"} |
| {"current_steps": 440, "total_steps": 600, "loss": 0.0572, "lr": 9.213508891098064e-06, "epoch": 11.0, "percentage": 73.33, "elapsed_time": "0:09:26", "remaining_time": "0:03:26"} |
| {"current_steps": 445, "total_steps": 600, "loss": 0.0381, "lr": 8.685355961895784e-06, "epoch": 11.127388535031848, "percentage": 74.17, "elapsed_time": "0:09:33", "remaining_time": "0:03:19"} |
| {"current_steps": 450, "total_steps": 600, "loss": 0.036, "lr": 8.169592144156885e-06, "epoch": 11.254777070063694, "percentage": 75.0, "elapsed_time": "0:09:40", "remaining_time": "0:03:13"} |
| {"current_steps": 450, "total_steps": 600, "eval_loss": 3.0192348957061768, "epoch": 11.254777070063694, "percentage": 75.0, "elapsed_time": "0:09:41", "remaining_time": "0:03:13"} |
| {"current_steps": 455, "total_steps": 600, "loss": 0.0416, "lr": 7.666609101678121e-06, "epoch": 11.382165605095542, "percentage": 75.83, "elapsed_time": "0:09:49", "remaining_time": "0:03:07"} |
| {"current_steps": 460, "total_steps": 600, "loss": 0.0469, "lr": 7.176788792715075e-06, "epoch": 11.509554140127388, "percentage": 76.67, "elapsed_time": "0:09:55", "remaining_time": "0:03:01"} |
| {"current_steps": 465, "total_steps": 600, "loss": 0.0593, "lr": 6.700503179928458e-06, "epoch": 11.636942675159236, "percentage": 77.5, "elapsed_time": "0:10:02", "remaining_time": "0:02:54"} |
| {"current_steps": 470, "total_steps": 600, "loss": 0.0322, "lr": 6.2381139479208564e-06, "epoch": 11.764331210191083, "percentage": 78.33, "elapsed_time": "0:10:09", "remaining_time": "0:02:48"} |
| {"current_steps": 475, "total_steps": 600, "loss": 0.03, "lr": 5.78997222857853e-06, "epoch": 11.89171974522293, "percentage": 79.17, "elapsed_time": "0:10:16", "remaining_time": "0:02:42"} |
| {"current_steps": 475, "total_steps": 600, "eval_loss": 3.0430448055267334, "epoch": 11.89171974522293, "percentage": 79.17, "elapsed_time": "0:10:17", "remaining_time": "0:02:42"} |
| {"current_steps": 480, "total_steps": 600, "loss": 0.0206, "lr": 5.356418334426791e-06, "epoch": 12.0, "percentage": 80.0, "elapsed_time": "0:10:22", "remaining_time": "0:02:35"} |
| {"current_steps": 485, "total_steps": 600, "loss": 0.0269, "lr": 4.937781500201474e-06, "epoch": 12.127388535031848, "percentage": 80.83, "elapsed_time": "0:10:28", "remaining_time": "0:02:29"} |
| {"current_steps": 490, "total_steps": 600, "loss": 0.0243, "lr": 4.534379632832692e-06, "epoch": 12.254777070063694, "percentage": 81.67, "elapsed_time": "0:10:35", "remaining_time": "0:02:22"} |
| {"current_steps": 495, "total_steps": 600, "loss": 0.0227, "lr": 4.146519070030757e-06, "epoch": 12.382165605095542, "percentage": 82.5, "elapsed_time": "0:10:41", "remaining_time": "0:02:16"} |
| {"current_steps": 500, "total_steps": 600, "loss": 0.0226, "lr": 3.7744943476576562e-06, "epoch": 12.509554140127388, "percentage": 83.33, "elapsed_time": "0:10:47", "remaining_time": "0:02:09"} |
| {"current_steps": 500, "total_steps": 600, "eval_loss": 3.151336908340454, "epoch": 12.509554140127388, "percentage": 83.33, "elapsed_time": "0:10:48", "remaining_time": "0:02:09"} |
| {"current_steps": 505, "total_steps": 600, "loss": 0.0206, "lr": 3.418587976060653e-06, "epoch": 12.636942675159236, "percentage": 84.17, "elapsed_time": "0:10:56", "remaining_time": "0:02:03"} |
| {"current_steps": 510, "total_steps": 600, "loss": 0.0287, "lr": 3.0790702255378974e-06, "epoch": 12.764331210191083, "percentage": 85.0, "elapsed_time": "0:11:02", "remaining_time": "0:01:56"} |
| {"current_steps": 515, "total_steps": 600, "loss": 0.0218, "lr": 2.7561989210989235e-06, "epoch": 12.89171974522293, "percentage": 85.83, "elapsed_time": "0:11:08", "remaining_time": "0:01:50"} |
| {"current_steps": 520, "total_steps": 600, "loss": 0.0268, "lr": 2.4502192466760276e-06, "epoch": 13.0, "percentage": 86.67, "elapsed_time": "0:11:14", "remaining_time": "0:01:43"} |
| {"current_steps": 525, "total_steps": 600, "loss": 0.0155, "lr": 2.1613635589349756e-06, "epoch": 13.127388535031848, "percentage": 87.5, "elapsed_time": "0:11:20", "remaining_time": "0:01:37"} |
| {"current_steps": 525, "total_steps": 600, "eval_loss": 3.1609668731689453, "epoch": 13.127388535031848, "percentage": 87.5, "elapsed_time": "0:11:22", "remaining_time": "0:01:37"} |
| {"current_steps": 530, "total_steps": 600, "loss": 0.017, "lr": 1.8898512108266569e-06, "epoch": 13.254777070063694, "percentage": 88.33, "elapsed_time": "0:11:28", "remaining_time": "0:01:30"} |
| {"current_steps": 535, "total_steps": 600, "loss": 0.0154, "lr": 1.6358883850134816e-06, "epoch": 13.382165605095542, "percentage": 89.17, "elapsed_time": "0:11:34", "remaining_time": "0:01:24"} |
| {"current_steps": 540, "total_steps": 600, "loss": 0.0205, "lr": 1.3996679372972304e-06, "epoch": 13.509554140127388, "percentage": 90.0, "elapsed_time": "0:11:40", "remaining_time": "0:01:17"} |
| {"current_steps": 545, "total_steps": 600, "loss": 0.0249, "lr": 1.1813692501670276e-06, "epoch": 13.636942675159236, "percentage": 90.83, "elapsed_time": "0:11:46", "remaining_time": "0:01:11"} |
| {"current_steps": 550, "total_steps": 600, "loss": 0.015, "lr": 9.811580965787965e-07, "epoch": 13.764331210191083, "percentage": 91.67, "elapsed_time": "0:11:52", "remaining_time": "0:01:04"} |
| {"current_steps": 550, "total_steps": 600, "eval_loss": 3.177839517593384, "epoch": 13.764331210191083, "percentage": 91.67, "elapsed_time": "0:11:54", "remaining_time": "0:01:04"} |
| {"current_steps": 555, "total_steps": 600, "loss": 0.0146, "lr": 7.991865140696331e-07, "epoch": 13.89171974522293, "percentage": 92.5, "elapsed_time": "0:12:01", "remaining_time": "0:00:58"} |
| {"current_steps": 560, "total_steps": 600, "loss": 0.0167, "lr": 6.355926893026054e-07, "epoch": 14.0, "percentage": 93.33, "elapsed_time": "0:12:06", "remaining_time": "0:00:51"} |
| {"current_steps": 565, "total_steps": 600, "loss": 0.0153, "lr": 4.905008531297661e-07, "epoch": 14.127388535031848, "percentage": 94.17, "elapsed_time": "0:12:13", "remaining_time": "0:00:45"} |
| {"current_steps": 570, "total_steps": 600, "loss": 0.017, "lr": 3.640211862529802e-07, "epoch": 14.254777070063694, "percentage": 95.0, "elapsed_time": "0:12:19", "remaining_time": "0:00:38"} |
| {"current_steps": 575, "total_steps": 600, "loss": 0.0169, "lr": 2.5624973555424815e-07, "epoch": 14.382165605095542, "percentage": 95.83, "elapsed_time": "0:12:25", "remaining_time": "0:00:32"} |
| {"current_steps": 575, "total_steps": 600, "eval_loss": 3.2097647190093994, "epoch": 14.382165605095542, "percentage": 95.83, "elapsed_time": "0:12:26", "remaining_time": "0:00:32"} |
| {"current_steps": 580, "total_steps": 600, "loss": 0.0131, "lr": 1.6726834115904643e-07, "epoch": 14.509554140127388, "percentage": 96.67, "elapsed_time": "0:12:32", "remaining_time": "0:00:25"} |
| {"current_steps": 585, "total_steps": 600, "loss": 0.0146, "lr": 9.71445742881022e-08, "epoch": 14.636942675159236, "percentage": 97.5, "elapsed_time": "0:12:39", "remaining_time": "0:00:19"} |
| {"current_steps": 590, "total_steps": 600, "loss": 0.0138, "lr": 4.593168594474728e-08, "epoch": 14.764331210191083, "percentage": 98.33, "elapsed_time": "0:12:45", "remaining_time": "0:00:12"} |
| {"current_steps": 595, "total_steps": 600, "loss": 0.0125, "lr": 1.3668566476848777e-08, "epoch": 14.89171974522293, "percentage": 99.17, "elapsed_time": "0:12:51", "remaining_time": "0:00:06"} |
| {"current_steps": 600, "total_steps": 600, "loss": 0.0223, "lr": 3.7971604404107854e-10, "epoch": 15.0, "percentage": 100.0, "elapsed_time": "0:12:56", "remaining_time": "0:00:00"} |
| {"current_steps": 600, "total_steps": 600, "eval_loss": 3.207829236984253, "epoch": 15.0, "percentage": 100.0, "elapsed_time": "0:12:57", "remaining_time": "0:00:00"} |
| {"current_steps": 600, "total_steps": 600, "epoch": 15.0, "percentage": 100.0, "elapsed_time": "0:12:59", "remaining_time": "0:00:00"} |
|
|