| {"current_steps": 1, "total_steps": 400, "loss": 0.7859, "lr": 0.0, "epoch": 0.2909090909090909, "percentage": 0.25, "elapsed_time": "0:00:08", "remaining_time": "0:54:43"} | |
| {"current_steps": 2, "total_steps": 400, "loss": 0.7965, "lr": 2.5e-08, "epoch": 0.5818181818181818, "percentage": 0.5, "elapsed_time": "0:00:14", "remaining_time": "0:48:18"} | |
| {"current_steps": 3, "total_steps": 400, "loss": 0.7893, "lr": 5e-08, "epoch": 0.8727272727272727, "percentage": 0.75, "elapsed_time": "0:00:21", "remaining_time": "0:47:43"} | |
| {"current_steps": 4, "total_steps": 400, "loss": 0.8701, "lr": 7.5e-08, "epoch": 1.0, "percentage": 1.0, "elapsed_time": "0:00:24", "remaining_time": "0:40:29"} | |
| {"current_steps": 1, "total_steps": 400, "loss": 0.7859, "lr": 0.0, "epoch": 0.2909090909090909, "percentage": 0.25, "elapsed_time": "0:00:08", "remaining_time": "0:59:46"} | |
| {"current_steps": 2, "total_steps": 400, "loss": 0.7965, "lr": 2.5e-08, "epoch": 0.5818181818181818, "percentage": 0.5, "elapsed_time": "0:00:14", "remaining_time": "0:49:28"} | |
| {"current_steps": 3, "total_steps": 400, "loss": 0.789, "lr": 5e-08, "epoch": 0.8727272727272727, "percentage": 0.75, "elapsed_time": "0:00:21", "remaining_time": "0:47:28"} | |
| {"current_steps": 4, "total_steps": 400, "loss": 0.8701, "lr": 7.5e-08, "epoch": 1.0, "percentage": 1.0, "elapsed_time": "0:00:24", "remaining_time": "0:40:04"} | |
| {"current_steps": 5, "total_steps": 400, "loss": 0.7781, "lr": 1e-07, "epoch": 1.290909090909091, "percentage": 1.25, "elapsed_time": "0:01:10", "remaining_time": "1:33:01"} | |
| {"current_steps": 6, "total_steps": 400, "loss": 0.7594, "lr": 1.25e-07, "epoch": 1.5818181818181818, "percentage": 1.5, "elapsed_time": "0:01:16", "remaining_time": "1:24:13"} | |
| {"current_steps": 7, "total_steps": 400, "loss": 0.8306, "lr": 1.5e-07, "epoch": 1.8727272727272726, "percentage": 1.75, "elapsed_time": "0:01:23", "remaining_time": "1:17:59"} | |
| {"current_steps": 8, "total_steps": 400, "loss": 0.8823, "lr": 1.75e-07, "epoch": 2.0, "percentage": 2.0, "elapsed_time": "0:01:26", "remaining_time": "1:10:30"} | |
| {"current_steps": 1, "total_steps": 400, "loss": 0.7859, "lr": 0.0, "epoch": 0.2909090909090909, "percentage": 0.25, "elapsed_time": "0:00:07", "remaining_time": "0:47:14"} | |
| {"current_steps": 2, "total_steps": 400, "loss": 0.7965, "lr": 2.5e-08, "epoch": 0.5818181818181818, "percentage": 0.5, "elapsed_time": "0:00:13", "remaining_time": "0:43:46"} | |
| {"current_steps": 3, "total_steps": 400, "loss": 0.7894, "lr": 5e-08, "epoch": 0.8727272727272727, "percentage": 0.75, "elapsed_time": "0:00:20", "remaining_time": "0:44:26"} | |
| {"current_steps": 4, "total_steps": 400, "loss": 0.8702, "lr": 7.5e-08, "epoch": 1.0, "percentage": 1.0, "elapsed_time": "0:00:22", "remaining_time": "0:37:53"} | |
| {"current_steps": 5, "total_steps": 400, "loss": 0.7782, "lr": 1e-07, "epoch": 1.290909090909091, "percentage": 1.25, "elapsed_time": "0:01:12", "remaining_time": "1:35:46"} | |
| {"current_steps": 6, "total_steps": 400, "loss": 0.7593, "lr": 1.25e-07, "epoch": 1.5818181818181818, "percentage": 1.5, "elapsed_time": "0:01:19", "remaining_time": "1:26:36"} | |
| {"current_steps": 7, "total_steps": 400, "loss": 0.8308, "lr": 1.5e-07, "epoch": 1.8727272727272726, "percentage": 1.75, "elapsed_time": "0:01:25", "remaining_time": "1:20:14"} | |
| {"current_steps": 8, "total_steps": 400, "loss": 0.8818, "lr": 1.75e-07, "epoch": 2.0, "percentage": 2.0, "elapsed_time": "0:01:29", "remaining_time": "1:12:46"} | |
| {"current_steps": 9, "total_steps": 400, "loss": 0.7997, "lr": 2e-07, "epoch": 2.290909090909091, "percentage": 2.25, "elapsed_time": "0:02:08", "remaining_time": "1:33:13"} | |
| {"current_steps": 10, "total_steps": 400, "loss": 0.8195, "lr": 2.25e-07, "epoch": 2.581818181818182, "percentage": 2.5, "elapsed_time": "0:02:14", "remaining_time": "1:27:40"} | |
| {"current_steps": 11, "total_steps": 400, "loss": 0.7756, "lr": 2.5e-07, "epoch": 2.8727272727272726, "percentage": 2.75, "elapsed_time": "0:02:21", "remaining_time": "1:23:29"} | |
| {"current_steps": 12, "total_steps": 400, "loss": 0.8277, "lr": 2.75e-07, "epoch": 3.0, "percentage": 3.0, "elapsed_time": "0:02:24", "remaining_time": "1:17:59"} | |
| {"current_steps": 13, "total_steps": 400, "loss": 0.8359, "lr": 3e-07, "epoch": 3.290909090909091, "percentage": 3.25, "elapsed_time": "0:03:05", "remaining_time": "1:32:08"} | |
| {"current_steps": 14, "total_steps": 400, "loss": 0.8357, "lr": 3.25e-07, "epoch": 3.581818181818182, "percentage": 3.5, "elapsed_time": "0:03:11", "remaining_time": "1:28:10"} | |
| {"current_steps": 15, "total_steps": 400, "loss": 0.7685, "lr": 3.5e-07, "epoch": 3.8727272727272726, "percentage": 3.75, "elapsed_time": "0:03:18", "remaining_time": "1:25:02"} | |
| {"current_steps": 16, "total_steps": 400, "loss": 0.6977, "lr": 3.75e-07, "epoch": 4.0, "percentage": 4.0, "elapsed_time": "0:03:21", "remaining_time": "1:20:36"} | |
| {"current_steps": 17, "total_steps": 400, "loss": 0.772, "lr": 4e-07, "epoch": 4.290909090909091, "percentage": 4.25, "elapsed_time": "0:04:09", "remaining_time": "1:33:48"} | |
| {"current_steps": 18, "total_steps": 400, "loss": 0.8564, "lr": 4.2499999999999995e-07, "epoch": 4.581818181818182, "percentage": 4.5, "elapsed_time": "0:04:16", "remaining_time": "1:30:38"} | |
| {"current_steps": 19, "total_steps": 400, "loss": 0.7761, "lr": 4.5e-07, "epoch": 4.872727272727273, "percentage": 4.75, "elapsed_time": "0:04:23", "remaining_time": "1:27:58"} | |
| {"current_steps": 20, "total_steps": 400, "loss": 0.7591, "lr": 4.7499999999999995e-07, "epoch": 5.0, "percentage": 5.0, "elapsed_time": "0:04:26", "remaining_time": "1:24:14"} | |
| {"current_steps": 21, "total_steps": 400, "loss": 0.7278, "lr": 5e-07, "epoch": 5.290909090909091, "percentage": 5.25, "elapsed_time": "0:05:07", "remaining_time": "1:32:31"} | |
| {"current_steps": 22, "total_steps": 400, "loss": 0.7982, "lr": 5.25e-07, "epoch": 5.581818181818182, "percentage": 5.5, "elapsed_time": "0:05:14", "remaining_time": "1:30:00"} | |
| {"current_steps": 23, "total_steps": 400, "loss": 0.8049, "lr": 5.5e-07, "epoch": 5.872727272727273, "percentage": 5.75, "elapsed_time": "0:05:21", "remaining_time": "1:27:43"} | |
| {"current_steps": 24, "total_steps": 400, "loss": 0.8064, "lr": 5.749999999999999e-07, "epoch": 6.0, "percentage": 6.0, "elapsed_time": "0:05:23", "remaining_time": "1:24:31"} | |
| {"current_steps": 1, "total_steps": 400, "loss": 0.7859, "lr": 0.0, "epoch": 0.2909090909090909, "percentage": 0.25, "elapsed_time": "0:00:08", "remaining_time": "0:55:32"} | |
| {"current_steps": 2, "total_steps": 400, "loss": 0.7965, "lr": 2.5e-08, "epoch": 0.5818181818181818, "percentage": 0.5, "elapsed_time": "0:00:14", "remaining_time": "0:48:09"} | |
| {"current_steps": 3, "total_steps": 400, "loss": 0.7892, "lr": 5e-08, "epoch": 0.8727272727272727, "percentage": 0.75, "elapsed_time": "0:00:21", "remaining_time": "0:46:56"} | |
| {"current_steps": 4, "total_steps": 400, "loss": 0.8702, "lr": 7.5e-08, "epoch": 1.0, "percentage": 1.0, "elapsed_time": "0:00:24", "remaining_time": "0:39:42"} | |
| {"current_steps": 5, "total_steps": 400, "loss": 0.7783, "lr": 1e-07, "epoch": 1.290909090909091, "percentage": 1.25, "elapsed_time": "0:00:30", "remaining_time": "0:40:37"} | |
| {"current_steps": 6, "total_steps": 400, "loss": 0.7594, "lr": 1.25e-07, "epoch": 1.5818181818181818, "percentage": 1.5, "elapsed_time": "0:00:37", "remaining_time": "0:40:32"} | |
| {"current_steps": 7, "total_steps": 400, "loss": 0.8305, "lr": 1.5e-07, "epoch": 1.8727272727272726, "percentage": 1.75, "elapsed_time": "0:00:43", "remaining_time": "0:40:33"} | |
| {"current_steps": 8, "total_steps": 400, "loss": 0.8818, "lr": 1.75e-07, "epoch": 2.0, "percentage": 2.0, "elapsed_time": "0:00:46", "remaining_time": "0:37:48"} | |
| {"current_steps": 9, "total_steps": 400, "loss": 0.7999, "lr": 2e-07, "epoch": 2.290909090909091, "percentage": 2.25, "elapsed_time": "0:00:52", "remaining_time": "0:38:20"} | |
| {"current_steps": 10, "total_steps": 400, "loss": 0.8195, "lr": 2.25e-07, "epoch": 2.581818181818182, "percentage": 2.5, "elapsed_time": "0:00:58", "remaining_time": "0:38:16"} | |
| {"current_steps": 11, "total_steps": 400, "loss": 0.7757, "lr": 2.5e-07, "epoch": 2.8727272727272726, "percentage": 2.75, "elapsed_time": "0:01:05", "remaining_time": "0:38:39"} | |
| {"current_steps": 12, "total_steps": 400, "loss": 0.8272, "lr": 2.75e-07, "epoch": 3.0, "percentage": 3.0, "elapsed_time": "0:01:08", "remaining_time": "0:36:59"} | |
| {"current_steps": 13, "total_steps": 400, "loss": 0.8356, "lr": 3e-07, "epoch": 3.290909090909091, "percentage": 3.25, "elapsed_time": "0:01:15", "remaining_time": "0:37:18"} | |
| {"current_steps": 14, "total_steps": 400, "loss": 0.8362, "lr": 3.25e-07, "epoch": 3.581818181818182, "percentage": 3.5, "elapsed_time": "0:01:21", "remaining_time": "0:37:21"} | |
| {"current_steps": 15, "total_steps": 400, "loss": 0.7687, "lr": 3.5e-07, "epoch": 3.8727272727272726, "percentage": 3.75, "elapsed_time": "0:01:28", "remaining_time": "0:37:40"} | |
| {"current_steps": 16, "total_steps": 400, "loss": 0.6977, "lr": 3.75e-07, "epoch": 4.0, "percentage": 4.0, "elapsed_time": "0:01:30", "remaining_time": "0:36:19"} | |
| {"current_steps": 17, "total_steps": 400, "loss": 0.7719, "lr": 4e-07, "epoch": 4.290909090909091, "percentage": 4.25, "elapsed_time": "0:01:37", "remaining_time": "0:36:31"} | |
| {"current_steps": 18, "total_steps": 400, "loss": 0.857, "lr": 4.2499999999999995e-07, "epoch": 4.581818181818182, "percentage": 4.5, "elapsed_time": "0:01:43", "remaining_time": "0:36:36"} | |
| {"current_steps": 19, "total_steps": 400, "loss": 0.7761, "lr": 4.5e-07, "epoch": 4.872727272727273, "percentage": 4.75, "elapsed_time": "0:01:50", "remaining_time": "0:36:50"} | |
| {"current_steps": 20, "total_steps": 400, "loss": 0.7588, "lr": 4.7499999999999995e-07, "epoch": 5.0, "percentage": 5.0, "elapsed_time": "0:01:52", "remaining_time": "0:35:46"} | |
| {"current_steps": 21, "total_steps": 400, "loss": 0.7277, "lr": 5e-07, "epoch": 5.290909090909091, "percentage": 5.25, "elapsed_time": "0:01:59", "remaining_time": "0:35:53"} | |
| {"current_steps": 22, "total_steps": 400, "loss": 0.7982, "lr": 5.25e-07, "epoch": 5.581818181818182, "percentage": 5.5, "elapsed_time": "0:02:06", "remaining_time": "0:36:05"} | |
| {"current_steps": 23, "total_steps": 400, "loss": 0.8048, "lr": 5.5e-07, "epoch": 5.872727272727273, "percentage": 5.75, "elapsed_time": "0:02:12", "remaining_time": "0:36:14"} | |
| {"current_steps": 24, "total_steps": 400, "loss": 0.8067, "lr": 5.749999999999999e-07, "epoch": 6.0, "percentage": 6.0, "elapsed_time": "0:02:15", "remaining_time": "0:35:18"} | |
| {"current_steps": 25, "total_steps": 400, "loss": 0.8101, "lr": 6e-07, "epoch": 6.290909090909091, "percentage": 6.25, "elapsed_time": "0:02:21", "remaining_time": "0:35:27"} | |
| {"current_steps": 26, "total_steps": 400, "loss": 0.7327, "lr": 6.249999999999999e-07, "epoch": 6.581818181818182, "percentage": 6.5, "elapsed_time": "0:02:28", "remaining_time": "0:35:34"} | |
| {"current_steps": 27, "total_steps": 400, "loss": 0.7906, "lr": 6.5e-07, "epoch": 6.872727272727273, "percentage": 6.75, "elapsed_time": "0:02:34", "remaining_time": "0:35:38"} | |
| {"current_steps": 28, "total_steps": 400, "loss": 0.6975, "lr": 6.75e-07, "epoch": 7.0, "percentage": 7.0, "elapsed_time": "0:02:37", "remaining_time": "0:34:50"} | |
| {"current_steps": 29, "total_steps": 400, "loss": 0.7316, "lr": 7e-07, "epoch": 7.290909090909091, "percentage": 7.25, "elapsed_time": "0:02:43", "remaining_time": "0:34:54"} | |
| {"current_steps": 30, "total_steps": 400, "loss": 0.7377, "lr": 7.249999999999999e-07, "epoch": 7.581818181818182, "percentage": 7.5, "elapsed_time": "0:02:50", "remaining_time": "0:34:57"} | |
| {"current_steps": 31, "total_steps": 400, "loss": 0.7336, "lr": 7.5e-07, "epoch": 7.872727272727273, "percentage": 7.75, "elapsed_time": "0:02:57", "remaining_time": "0:35:07"} | |
| {"current_steps": 32, "total_steps": 400, "loss": 0.8509, "lr": 7.75e-07, "epoch": 8.0, "percentage": 8.0, "elapsed_time": "0:02:59", "remaining_time": "0:34:24"} | |
| {"current_steps": 33, "total_steps": 400, "loss": 0.7248, "lr": 8e-07, "epoch": 8.290909090909091, "percentage": 8.25, "elapsed_time": "0:03:06", "remaining_time": "0:34:31"} | |
| {"current_steps": 34, "total_steps": 400, "loss": 0.7692, "lr": 8.249999999999999e-07, "epoch": 8.581818181818182, "percentage": 8.5, "elapsed_time": "0:03:12", "remaining_time": "0:34:36"} | |
| {"current_steps": 35, "total_steps": 400, "loss": 0.6783, "lr": 8.499999999999999e-07, "epoch": 8.872727272727273, "percentage": 8.75, "elapsed_time": "0:03:18", "remaining_time": "0:34:33"} | |
| {"current_steps": 36, "total_steps": 400, "loss": 0.7678, "lr": 8.75e-07, "epoch": 9.0, "percentage": 9.0, "elapsed_time": "0:03:21", "remaining_time": "0:33:59"} | |
| {"current_steps": 37, "total_steps": 400, "loss": 0.6887, "lr": 9e-07, "epoch": 9.290909090909091, "percentage": 9.25, "elapsed_time": "0:03:28", "remaining_time": "0:34:01"} | |
| {"current_steps": 38, "total_steps": 400, "loss": 0.7304, "lr": 9.25e-07, "epoch": 9.581818181818182, "percentage": 9.5, "elapsed_time": "0:03:34", "remaining_time": "0:34:07"} | |
| {"current_steps": 39, "total_steps": 400, "loss": 0.6685, "lr": 9.499999999999999e-07, "epoch": 9.872727272727273, "percentage": 9.75, "elapsed_time": "0:03:41", "remaining_time": "0:34:08"} | |
| {"current_steps": 40, "total_steps": 400, "loss": 0.5981, "lr": 9.75e-07, "epoch": 10.0, "percentage": 10.0, "elapsed_time": "0:03:44", "remaining_time": "0:33:36"} | |
| {"current_steps": 41, "total_steps": 400, "loss": 0.6196, "lr": 1e-06, "epoch": 10.290909090909091, "percentage": 10.25, "elapsed_time": "0:03:50", "remaining_time": "0:33:38"} | |
| {"current_steps": 42, "total_steps": 400, "loss": 0.6595, "lr": 9.999809615320856e-07, "epoch": 10.581818181818182, "percentage": 10.5, "elapsed_time": "0:03:57", "remaining_time": "0:33:41"} | |
| {"current_steps": 43, "total_steps": 400, "loss": 0.6998, "lr": 9.999238475781957e-07, "epoch": 10.872727272727273, "percentage": 10.75, "elapsed_time": "0:04:03", "remaining_time": "0:33:42"} | |
| {"current_steps": 1, "total_steps": 400, "loss": 0.7859, "lr": 0.0, "epoch": 0.2909090909090909, "percentage": 0.25, "elapsed_time": "0:00:07", "remaining_time": "0:48:47"} | |
| {"current_steps": 2, "total_steps": 400, "loss": 0.7965, "lr": 2.5e-08, "epoch": 0.5818181818181818, "percentage": 0.5, "elapsed_time": "0:00:13", "remaining_time": "0:44:43"} | |
| {"current_steps": 3, "total_steps": 400, "loss": 0.7891, "lr": 5e-08, "epoch": 0.8727272727272727, "percentage": 0.75, "elapsed_time": "0:00:20", "remaining_time": "0:44:43"} | |
| {"current_steps": 4, "total_steps": 400, "loss": 0.8702, "lr": 7.5e-08, "epoch": 1.0, "percentage": 1.0, "elapsed_time": "0:00:23", "remaining_time": "0:38:09"} | |
| {"current_steps": 5, "total_steps": 400, "loss": 0.7781, "lr": 1e-07, "epoch": 1.290909090909091, "percentage": 1.25, "elapsed_time": "0:00:30", "remaining_time": "0:39:37"} | |
| {"current_steps": 6, "total_steps": 400, "loss": 0.7592, "lr": 1.25e-07, "epoch": 1.5818181818181818, "percentage": 1.5, "elapsed_time": "0:00:36", "remaining_time": "0:39:48"} | |
| {"current_steps": 7, "total_steps": 400, "loss": 0.8304, "lr": 1.5e-07, "epoch": 1.8727272727272726, "percentage": 1.75, "elapsed_time": "0:00:42", "remaining_time": "0:39:57"} | |
| {"current_steps": 8, "total_steps": 400, "loss": 0.8826, "lr": 1.75e-07, "epoch": 2.0, "percentage": 2.0, "elapsed_time": "0:00:45", "remaining_time": "0:37:19"} | |
| {"current_steps": 9, "total_steps": 400, "loss": 0.7995, "lr": 2e-07, "epoch": 2.290909090909091, "percentage": 2.25, "elapsed_time": "0:00:52", "remaining_time": "0:37:55"} | |
| {"current_steps": 10, "total_steps": 400, "loss": 0.8191, "lr": 2.25e-07, "epoch": 2.581818181818182, "percentage": 2.5, "elapsed_time": "0:00:58", "remaining_time": "0:37:53"} | |
| {"current_steps": 11, "total_steps": 400, "loss": 0.7757, "lr": 2.5e-07, "epoch": 2.8727272727272726, "percentage": 2.75, "elapsed_time": "0:01:04", "remaining_time": "0:38:16"} | |
| {"current_steps": 12, "total_steps": 400, "loss": 0.8279, "lr": 2.75e-07, "epoch": 3.0, "percentage": 3.0, "elapsed_time": "0:01:08", "remaining_time": "0:36:38"} | |
| {"current_steps": 13, "total_steps": 400, "loss": 0.8357, "lr": 3e-07, "epoch": 3.290909090909091, "percentage": 3.25, "elapsed_time": "0:01:14", "remaining_time": "0:37:03"} | |
| {"current_steps": 14, "total_steps": 400, "loss": 0.8365, "lr": 3.25e-07, "epoch": 3.581818181818182, "percentage": 3.5, "elapsed_time": "0:01:20", "remaining_time": "0:37:09"} | |
| {"current_steps": 15, "total_steps": 400, "loss": 0.7686, "lr": 3.5e-07, "epoch": 3.8727272727272726, "percentage": 3.75, "elapsed_time": "0:01:27", "remaining_time": "0:37:31"} | |
| {"current_steps": 16, "total_steps": 400, "loss": 0.6977, "lr": 3.75e-07, "epoch": 4.0, "percentage": 4.0, "elapsed_time": "0:01:30", "remaining_time": "0:36:10"} | |
| {"current_steps": 17, "total_steps": 400, "loss": 0.772, "lr": 4e-07, "epoch": 4.290909090909091, "percentage": 4.25, "elapsed_time": "0:01:36", "remaining_time": "0:36:24"} | |
| {"current_steps": 18, "total_steps": 400, "loss": 0.8569, "lr": 4.2499999999999995e-07, "epoch": 4.581818181818182, "percentage": 4.5, "elapsed_time": "0:01:43", "remaining_time": "0:36:30"} | |
| {"current_steps": 19, "total_steps": 400, "loss": 0.7768, "lr": 4.5e-07, "epoch": 4.872727272727273, "percentage": 4.75, "elapsed_time": "0:01:50", "remaining_time": "0:36:46"} | |
| {"current_steps": 20, "total_steps": 400, "loss": 0.7591, "lr": 4.7499999999999995e-07, "epoch": 5.0, "percentage": 5.0, "elapsed_time": "0:01:52", "remaining_time": "0:35:45"} | |
| {"current_steps": 21, "total_steps": 400, "loss": 0.7275, "lr": 5e-07, "epoch": 5.290909090909091, "percentage": 5.25, "elapsed_time": "0:01:59", "remaining_time": "0:35:54"} | |
| {"current_steps": 22, "total_steps": 400, "loss": 0.7987, "lr": 5.25e-07, "epoch": 5.581818181818182, "percentage": 5.5, "elapsed_time": "0:02:06", "remaining_time": "0:36:06"} | |
| {"current_steps": 23, "total_steps": 400, "loss": 0.8043, "lr": 5.5e-07, "epoch": 5.872727272727273, "percentage": 5.75, "elapsed_time": "0:02:12", "remaining_time": "0:36:16"} | |
| {"current_steps": 24, "total_steps": 400, "loss": 0.8067, "lr": 5.749999999999999e-07, "epoch": 6.0, "percentage": 6.0, "elapsed_time": "0:02:15", "remaining_time": "0:35:22"} | |
| {"current_steps": 25, "total_steps": 400, "loss": 0.8101, "lr": 6e-07, "epoch": 6.290909090909091, "percentage": 6.25, "elapsed_time": "0:02:22", "remaining_time": "0:35:32"} | |
| {"current_steps": 26, "total_steps": 400, "loss": 0.7324, "lr": 6.249999999999999e-07, "epoch": 6.581818181818182, "percentage": 6.5, "elapsed_time": "0:02:28", "remaining_time": "0:35:41"} | |
| {"current_steps": 27, "total_steps": 400, "loss": 0.7906, "lr": 6.5e-07, "epoch": 6.872727272727273, "percentage": 6.75, "elapsed_time": "0:02:35", "remaining_time": "0:35:46"} | |
| {"current_steps": 28, "total_steps": 400, "loss": 0.6972, "lr": 6.75e-07, "epoch": 7.0, "percentage": 7.0, "elapsed_time": "0:02:37", "remaining_time": "0:34:59"} | |
| {"current_steps": 29, "total_steps": 400, "loss": 0.7314, "lr": 7e-07, "epoch": 7.290909090909091, "percentage": 7.25, "elapsed_time": "0:02:44", "remaining_time": "0:35:03"} | |
| {"current_steps": 30, "total_steps": 400, "loss": 0.7376, "lr": 7.249999999999999e-07, "epoch": 7.581818181818182, "percentage": 7.5, "elapsed_time": "0:02:50", "remaining_time": "0:35:07"} | |
| {"current_steps": 31, "total_steps": 400, "loss": 0.7336, "lr": 7.5e-07, "epoch": 7.872727272727273, "percentage": 7.75, "elapsed_time": "0:02:57", "remaining_time": "0:35:17"} | |
| {"current_steps": 32, "total_steps": 400, "loss": 0.8508, "lr": 7.75e-07, "epoch": 8.0, "percentage": 8.0, "elapsed_time": "0:03:00", "remaining_time": "0:34:35"} | |
| {"current_steps": 33, "total_steps": 400, "loss": 0.7245, "lr": 8e-07, "epoch": 8.290909090909091, "percentage": 8.25, "elapsed_time": "0:03:07", "remaining_time": "0:34:42"} | |
| {"current_steps": 34, "total_steps": 400, "loss": 0.7691, "lr": 8.249999999999999e-07, "epoch": 8.581818181818182, "percentage": 8.5, "elapsed_time": "0:03:14", "remaining_time": "0:34:48"} | |
| {"current_steps": 35, "total_steps": 400, "loss": 0.6785, "lr": 8.499999999999999e-07, "epoch": 8.872727272727273, "percentage": 8.75, "elapsed_time": "0:03:20", "remaining_time": "0:34:45"} | |
| {"current_steps": 36, "total_steps": 400, "loss": 0.7678, "lr": 8.75e-07, "epoch": 9.0, "percentage": 9.0, "elapsed_time": "0:03:22", "remaining_time": "0:34:11"} | |
| {"current_steps": 37, "total_steps": 400, "loss": 0.6887, "lr": 9e-07, "epoch": 9.290909090909091, "percentage": 9.25, "elapsed_time": "0:03:29", "remaining_time": "0:34:12"} | |
| {"current_steps": 38, "total_steps": 400, "loss": 0.7303, "lr": 9.25e-07, "epoch": 9.581818181818182, "percentage": 9.5, "elapsed_time": "0:03:36", "remaining_time": "0:34:18"} | |
| {"current_steps": 39, "total_steps": 400, "loss": 0.6687, "lr": 9.499999999999999e-07, "epoch": 9.872727272727273, "percentage": 9.75, "elapsed_time": "0:03:42", "remaining_time": "0:34:19"} | |
| {"current_steps": 40, "total_steps": 400, "loss": 0.5979, "lr": 9.75e-07, "epoch": 10.0, "percentage": 10.0, "elapsed_time": "0:03:45", "remaining_time": "0:33:48"} | |
| {"current_steps": 41, "total_steps": 400, "loss": 0.6194, "lr": 1e-06, "epoch": 10.290909090909091, "percentage": 10.25, "elapsed_time": "0:03:51", "remaining_time": "0:33:50"} | |
| {"current_steps": 42, "total_steps": 400, "loss": 0.6596, "lr": 9.999809615320856e-07, "epoch": 10.581818181818182, "percentage": 10.5, "elapsed_time": "0:03:58", "remaining_time": "0:33:53"} | |
| {"current_steps": 43, "total_steps": 400, "loss": 0.6998, "lr": 9.999238475781957e-07, "epoch": 10.872727272727273, "percentage": 10.75, "elapsed_time": "0:04:05", "remaining_time": "0:33:55"} | |
| {"current_steps": 44, "total_steps": 400, "loss": 0.6691, "lr": 9.998286624877785e-07, "epoch": 11.0, "percentage": 11.0, "elapsed_time": "0:04:07", "remaining_time": "0:33:25"} | |
| {"current_steps": 45, "total_steps": 400, "loss": 0.6218, "lr": 9.996954135095478e-07, "epoch": 11.290909090909091, "percentage": 11.25, "elapsed_time": "0:04:14", "remaining_time": "0:33:26"} | |
| {"current_steps": 46, "total_steps": 400, "loss": 0.603, "lr": 9.99524110790929e-07, "epoch": 11.581818181818182, "percentage": 11.5, "elapsed_time": "0:04:20", "remaining_time": "0:33:27"} | |
| {"current_steps": 47, "total_steps": 400, "loss": 0.7061, "lr": 9.99314767377287e-07, "epoch": 11.872727272727273, "percentage": 11.75, "elapsed_time": "0:04:27", "remaining_time": "0:33:31"} | |
| {"current_steps": 48, "total_steps": 400, "loss": 0.6531, "lr": 9.990673992109333e-07, "epoch": 12.0, "percentage": 12.0, "elapsed_time": "0:04:30", "remaining_time": "0:33:03"} | |
| {"current_steps": 49, "total_steps": 400, "loss": 0.6772, "lr": 9.98782025129912e-07, "epoch": 12.290909090909091, "percentage": 12.25, "elapsed_time": "0:04:36", "remaining_time": "0:33:03"} | |
| {"current_steps": 50, "total_steps": 400, "loss": 0.5937, "lr": 9.98458666866564e-07, "epoch": 12.581818181818182, "percentage": 12.5, "elapsed_time": "0:04:43", "remaining_time": "0:33:05"} | |
| {"current_steps": 51, "total_steps": 400, "loss": 0.6051, "lr": 9.980973490458728e-07, "epoch": 12.872727272727273, "percentage": 12.75, "elapsed_time": "0:04:49", "remaining_time": "0:33:03"} | |
| {"current_steps": 52, "total_steps": 400, "loss": 0.6327, "lr": 9.976980991835893e-07, "epoch": 13.0, "percentage": 13.0, "elapsed_time": "0:04:52", "remaining_time": "0:32:40"} | |
| {"current_steps": 53, "total_steps": 400, "loss": 0.6048, "lr": 9.972609476841365e-07, "epoch": 13.290909090909091, "percentage": 13.25, "elapsed_time": "0:04:59", "remaining_time": "0:32:40"} | |
| {"current_steps": 54, "total_steps": 400, "loss": 0.5989, "lr": 9.967859278382937e-07, "epoch": 13.581818181818182, "percentage": 13.5, "elapsed_time": "0:05:05", "remaining_time": "0:32:38"} | |
| {"current_steps": 55, "total_steps": 400, "loss": 0.5144, "lr": 9.96273075820661e-07, "epoch": 13.872727272727273, "percentage": 13.75, "elapsed_time": "0:05:12", "remaining_time": "0:32:40"} | |
| {"current_steps": 56, "total_steps": 400, "loss": 0.7319, "lr": 9.957224306869053e-07, "epoch": 14.0, "percentage": 14.0, "elapsed_time": "0:05:15", "remaining_time": "0:32:16"} | |
| {"current_steps": 57, "total_steps": 400, "loss": 0.5676, "lr": 9.95134034370785e-07, "epoch": 14.290909090909091, "percentage": 14.25, "elapsed_time": "0:05:22", "remaining_time": "0:32:20"} | |
| {"current_steps": 58, "total_steps": 400, "loss": 0.5846, "lr": 9.945079316809584e-07, "epoch": 14.581818181818182, "percentage": 14.5, "elapsed_time": "0:05:28", "remaining_time": "0:32:18"} | |
| {"current_steps": 59, "total_steps": 400, "loss": 0.602, "lr": 9.938441702975689e-07, "epoch": 14.872727272727273, "percentage": 14.75, "elapsed_time": "0:05:35", "remaining_time": "0:32:16"} | |
| {"current_steps": 60, "total_steps": 400, "loss": 0.503, "lr": 9.931428007686156e-07, "epoch": 15.0, "percentage": 15.0, "elapsed_time": "0:05:37", "remaining_time": "0:31:54"} | |
| {"current_steps": 61, "total_steps": 400, "loss": 0.535, "lr": 9.92403876506104e-07, "epoch": 15.290909090909091, "percentage": 15.25, "elapsed_time": "0:05:45", "remaining_time": "0:31:57"} | |
| {"current_steps": 62, "total_steps": 400, "loss": 0.5554, "lr": 9.916274537819773e-07, "epoch": 15.581818181818182, "percentage": 15.5, "elapsed_time": "0:05:50", "remaining_time": "0:31:53"} | |
| {"current_steps": 63, "total_steps": 400, "loss": 0.614, "lr": 9.90813591723832e-07, "epoch": 15.872727272727273, "percentage": 15.75, "elapsed_time": "0:05:57", "remaining_time": "0:31:53"} | |
| {"current_steps": 64, "total_steps": 400, "loss": 0.4917, "lr": 9.899623523104148e-07, "epoch": 16.0, "percentage": 16.0, "elapsed_time": "0:06:00", "remaining_time": "0:31:32"} | |
| {"current_steps": 65, "total_steps": 400, "loss": 0.5572, "lr": 9.890738003669027e-07, "epoch": 16.29090909090909, "percentage": 16.25, "elapsed_time": "0:06:07", "remaining_time": "0:31:34"} | |
| {"current_steps": 66, "total_steps": 400, "loss": 0.5196, "lr": 9.881480035599666e-07, "epoch": 16.581818181818182, "percentage": 16.5, "elapsed_time": "0:06:13", "remaining_time": "0:31:31"} | |
| {"current_steps": 67, "total_steps": 400, "loss": 0.5828, "lr": 9.871850323926177e-07, "epoch": 16.87272727272727, "percentage": 16.75, "elapsed_time": "0:06:20", "remaining_time": "0:31:30"} | |
| {"current_steps": 68, "total_steps": 400, "loss": 0.5128, "lr": 9.861849601988383e-07, "epoch": 17.0, "percentage": 17.0, "elapsed_time": "0:06:23", "remaining_time": "0:31:10"} | |
| {"current_steps": 69, "total_steps": 400, "loss": 0.5596, "lr": 9.851478631379982e-07, "epoch": 17.29090909090909, "percentage": 17.25, "elapsed_time": "0:06:29", "remaining_time": "0:31:09"} | |
| {"current_steps": 70, "total_steps": 400, "loss": 0.5787, "lr": 9.840738201890539e-07, "epoch": 17.581818181818182, "percentage": 17.5, "elapsed_time": "0:06:35", "remaining_time": "0:31:06"} | |
| {"current_steps": 71, "total_steps": 400, "loss": 0.4884, "lr": 9.82962913144534e-07, "epoch": 17.87272727272727, "percentage": 17.75, "elapsed_time": "0:06:42", "remaining_time": "0:31:03"} | |
| {"current_steps": 72, "total_steps": 400, "loss": 0.5233, "lr": 9.818152266043115e-07, "epoch": 18.0, "percentage": 18.0, "elapsed_time": "0:06:45", "remaining_time": "0:30:47"} | |
| {"current_steps": 73, "total_steps": 400, "loss": 0.5082, "lr": 9.806308479691594e-07, "epoch": 18.29090909090909, "percentage": 18.25, "elapsed_time": "0:06:52", "remaining_time": "0:30:46"} | |
| {"current_steps": 74, "total_steps": 400, "loss": 0.5583, "lr": 9.794098674340966e-07, "epoch": 18.581818181818182, "percentage": 18.5, "elapsed_time": "0:06:58", "remaining_time": "0:30:43"} | |
| {"current_steps": 75, "total_steps": 400, "loss": 0.5041, "lr": 9.781523779815178e-07, "epoch": 18.87272727272727, "percentage": 18.75, "elapsed_time": "0:07:05", "remaining_time": "0:30:42"} | |
| {"current_steps": 76, "total_steps": 400, "loss": 0.5379, "lr": 9.768584753741134e-07, "epoch": 19.0, "percentage": 19.0, "elapsed_time": "0:07:08", "remaining_time": "0:30:25"} | |
| {"current_steps": 77, "total_steps": 400, "loss": 0.5547, "lr": 9.755282581475767e-07, "epoch": 19.29090909090909, "percentage": 19.25, "elapsed_time": "0:07:14", "remaining_time": "0:30:22"} | |
| {"current_steps": 78, "total_steps": 400, "loss": 0.4499, "lr": 9.741618276030996e-07, "epoch": 19.581818181818182, "percentage": 19.5, "elapsed_time": "0:07:20", "remaining_time": "0:30:19"} | |
| {"current_steps": 79, "total_steps": 400, "loss": 0.5469, "lr": 9.727592877996584e-07, "epoch": 19.87272727272727, "percentage": 19.75, "elapsed_time": "0:07:27", "remaining_time": "0:30:18"} | |
| {"current_steps": 80, "total_steps": 400, "loss": 0.411, "lr": 9.713207455460892e-07, "epoch": 20.0, "percentage": 20.0, "elapsed_time": "0:07:30", "remaining_time": "0:30:02"} | |
| {"current_steps": 81, "total_steps": 400, "loss": 0.44, "lr": 9.698463103929541e-07, "epoch": 20.29090909090909, "percentage": 20.25, "elapsed_time": "0:07:37", "remaining_time": "0:30:01"} | |
| {"current_steps": 82, "total_steps": 400, "loss": 0.5108, "lr": 9.683360946241987e-07, "epoch": 20.581818181818182, "percentage": 20.5, "elapsed_time": "0:07:43", "remaining_time": "0:29:58"} | |
| {"current_steps": 83, "total_steps": 400, "loss": 0.509, "lr": 9.667902132486008e-07, "epoch": 20.87272727272727, "percentage": 20.75, "elapsed_time": "0:07:49", "remaining_time": "0:29:53"} | |
| {"current_steps": 84, "total_steps": 400, "loss": 0.518, "lr": 9.652087839910123e-07, "epoch": 21.0, "percentage": 21.0, "elapsed_time": "0:07:53", "remaining_time": "0:29:39"} | |
| {"current_steps": 85, "total_steps": 400, "loss": 0.5221, "lr": 9.635919272833937e-07, "epoch": 21.29090909090909, "percentage": 21.25, "elapsed_time": "0:08:00", "remaining_time": "0:29:40"} | |
| {"current_steps": 86, "total_steps": 400, "loss": 0.488, "lr": 9.619397662556433e-07, "epoch": 21.581818181818182, "percentage": 21.5, "elapsed_time": "0:08:06", "remaining_time": "0:29:35"} | |
| {"current_steps": 87, "total_steps": 400, "loss": 0.4174, "lr": 9.602524267262202e-07, "epoch": 21.87272727272727, "percentage": 21.75, "elapsed_time": "0:08:12", "remaining_time": "0:29:33"} | |
| {"current_steps": 88, "total_steps": 400, "loss": 0.4586, "lr": 9.58530037192562e-07, "epoch": 22.0, "percentage": 22.0, "elapsed_time": "0:08:15", "remaining_time": "0:29:16"} | |
| {"current_steps": 89, "total_steps": 400, "loss": 0.4392, "lr": 9.567727288213004e-07, "epoch": 22.29090909090909, "percentage": 22.25, "elapsed_time": "0:08:21", "remaining_time": "0:29:13"} | |
| {"current_steps": 90, "total_steps": 400, "loss": 0.475, "lr": 9.549806354382715e-07, "epoch": 22.581818181818182, "percentage": 22.5, "elapsed_time": "0:08:27", "remaining_time": "0:29:09"} | |
| {"current_steps": 91, "total_steps": 400, "loss": 0.4617, "lr": 9.531538935183249e-07, "epoch": 22.87272727272727, "percentage": 22.75, "elapsed_time": "0:08:34", "remaining_time": "0:29:06"} | |
| {"current_steps": 92, "total_steps": 400, "loss": 0.4534, "lr": 9.512926421749303e-07, "epoch": 23.0, "percentage": 23.0, "elapsed_time": "0:08:37", "remaining_time": "0:28:53"} | |
| {"current_steps": 93, "total_steps": 400, "loss": 0.4567, "lr": 9.493970231495834e-07, "epoch": 23.29090909090909, "percentage": 23.25, "elapsed_time": "0:08:44", "remaining_time": "0:28:51"} | |
| {"current_steps": 94, "total_steps": 400, "loss": 0.4521, "lr": 9.474671808010125e-07, "epoch": 23.581818181818182, "percentage": 23.5, "elapsed_time": "0:08:50", "remaining_time": "0:28:46"} | |
| {"current_steps": 95, "total_steps": 400, "loss": 0.4221, "lr": 9.455032620941839e-07, "epoch": 23.87272727272727, "percentage": 23.75, "elapsed_time": "0:08:57", "remaining_time": "0:28:44"} | |
| {"current_steps": 96, "total_steps": 400, "loss": 0.4577, "lr": 9.435054165891108e-07, "epoch": 24.0, "percentage": 24.0, "elapsed_time": "0:09:00", "remaining_time": "0:28:30"} | |
| {"current_steps": 97, "total_steps": 400, "loss": 0.4536, "lr": 9.414737964294634e-07, "epoch": 24.29090909090909, "percentage": 24.25, "elapsed_time": "0:09:06", "remaining_time": "0:28:28"} | |
| {"current_steps": 98, "total_steps": 400, "loss": 0.4085, "lr": 9.394085563309826e-07, "epoch": 24.581818181818182, "percentage": 24.5, "elapsed_time": "0:09:13", "remaining_time": "0:28:24"} | |
| {"current_steps": 99, "total_steps": 400, "loss": 0.4102, "lr": 9.373098535696978e-07, "epoch": 24.87272727272727, "percentage": 24.75, "elapsed_time": "0:09:19", "remaining_time": "0:28:21"} | |
| {"current_steps": 100, "total_steps": 400, "loss": 0.4833, "lr": 9.351778479699498e-07, "epoch": 25.0, "percentage": 25.0, "elapsed_time": "0:09:22", "remaining_time": "0:28:07"} | |
| {"current_steps": 100, "total_steps": 400, "eval_loss": 0.5104968547821045, "epoch": 25.0, "percentage": 25.0, "elapsed_time": "0:09:23", "remaining_time": "0:28:09"} | |
| {"current_steps": 101, "total_steps": 400, "loss": 0.4385, "lr": 9.330127018922193e-07, "epoch": 25.29090909090909, "percentage": 25.25, "elapsed_time": "0:09:29", "remaining_time": "0:28:06"} | |
| {"current_steps": 102, "total_steps": 400, "loss": 0.4111, "lr": 9.308145802207628e-07, "epoch": 25.581818181818182, "percentage": 25.5, "elapsed_time": "0:09:35", "remaining_time": "0:28:02"} | |
| {"current_steps": 103, "total_steps": 400, "loss": 0.3836, "lr": 9.285836503510562e-07, "epoch": 25.87272727272727, "percentage": 25.75, "elapsed_time": "0:09:42", "remaining_time": "0:27:59"} | |
| {"current_steps": 104, "total_steps": 400, "loss": 0.4733, "lr": 9.26320082177046e-07, "epoch": 26.0, "percentage": 26.0, "elapsed_time": "0:09:45", "remaining_time": "0:27:46"} | |
| {"current_steps": 105, "total_steps": 400, "loss": 0.4069, "lr": 9.240240480782129e-07, "epoch": 26.29090909090909, "percentage": 26.25, "elapsed_time": "0:09:52", "remaining_time": "0:27:43"} | |
| {"current_steps": 106, "total_steps": 400, "loss": 0.3598, "lr": 9.216957229064428e-07, "epoch": 26.581818181818182, "percentage": 26.5, "elapsed_time": "0:09:58", "remaining_time": "0:27:40"} | |
| {"current_steps": 107, "total_steps": 400, "loss": 0.4266, "lr": 9.19335283972712e-07, "epoch": 26.87272727272727, "percentage": 26.75, "elapsed_time": "0:10:04", "remaining_time": "0:27:36"} | |
| {"current_steps": 108, "total_steps": 400, "loss": 0.4543, "lr": 9.16942911033584e-07, "epoch": 27.0, "percentage": 27.0, "elapsed_time": "0:10:07", "remaining_time": "0:27:23"} | |
| {"current_steps": 109, "total_steps": 400, "loss": 0.4112, "lr": 9.145187862775208e-07, "epoch": 27.29090909090909, "percentage": 27.25, "elapsed_time": "0:10:14", "remaining_time": "0:27:20"} | |
| {"current_steps": 110, "total_steps": 400, "loss": 0.3953, "lr": 9.120630943110077e-07, "epoch": 27.581818181818182, "percentage": 27.5, "elapsed_time": "0:10:20", "remaining_time": "0:27:16"} | |
| {"current_steps": 111, "total_steps": 400, "loss": 0.3892, "lr": 9.095760221444959e-07, "epoch": 27.87272727272727, "percentage": 27.75, "elapsed_time": "0:10:27", "remaining_time": "0:27:14"} | |
| {"current_steps": 112, "total_steps": 400, "loss": 0.3663, "lr": 9.070577591781597e-07, "epoch": 28.0, "percentage": 28.0, "elapsed_time": "0:10:30", "remaining_time": "0:27:00"} | |
| {"current_steps": 113, "total_steps": 400, "loss": 0.4199, "lr": 9.045084971874737e-07, "epoch": 28.29090909090909, "percentage": 28.25, "elapsed_time": "0:10:37", "remaining_time": "0:26:58"} | |
| {"current_steps": 114, "total_steps": 400, "loss": 0.3542, "lr": 9.019284303086085e-07, "epoch": 28.581818181818182, "percentage": 28.5, "elapsed_time": "0:10:43", "remaining_time": "0:26:54"} | |
| {"current_steps": 115, "total_steps": 400, "loss": 0.3823, "lr": 8.993177550236463e-07, "epoch": 28.87272727272727, "percentage": 28.75, "elapsed_time": "0:10:49", "remaining_time": "0:26:50"} | |
| {"current_steps": 116, "total_steps": 400, "loss": 0.3442, "lr": 8.966766701456176e-07, "epoch": 29.0, "percentage": 29.0, "elapsed_time": "0:10:52", "remaining_time": "0:26:38"} | |
| {"current_steps": 117, "total_steps": 400, "loss": 0.335, "lr": 8.940053768033608e-07, "epoch": 29.29090909090909, "percentage": 29.25, "elapsed_time": "0:10:59", "remaining_time": "0:26:34"} | |
| {"current_steps": 118, "total_steps": 400, "loss": 0.4149, "lr": 8.913040784262069e-07, "epoch": 29.581818181818182, "percentage": 29.5, "elapsed_time": "0:11:06", "remaining_time": "0:26:31"} | |
| {"current_steps": 119, "total_steps": 400, "loss": 0.3765, "lr": 8.885729807284854e-07, "epoch": 29.87272727272727, "percentage": 29.75, "elapsed_time": "0:11:11", "remaining_time": "0:26:26"} | |
| {"current_steps": 120, "total_steps": 400, "loss": 0.3431, "lr": 8.858122916938599e-07, "epoch": 30.0, "percentage": 30.0, "elapsed_time": "0:11:15", "remaining_time": "0:26:15"} | |
| {"current_steps": 121, "total_steps": 400, "loss": 0.3791, "lr": 8.83022221559489e-07, "epoch": 30.29090909090909, "percentage": 30.25, "elapsed_time": "0:11:21", "remaining_time": "0:26:12"} | |
| {"current_steps": 122, "total_steps": 400, "loss": 0.3341, "lr": 8.802029828000155e-07, "epoch": 30.581818181818182, "percentage": 30.5, "elapsed_time": "0:11:28", "remaining_time": "0:26:09"} | |
| {"current_steps": 123, "total_steps": 400, "loss": 0.3987, "lr": 8.773547901113861e-07, "epoch": 30.87272727272727, "percentage": 30.75, "elapsed_time": "0:11:34", "remaining_time": "0:26:04"} | |
| {"current_steps": 124, "total_steps": 400, "loss": 0.3045, "lr": 8.744778603945011e-07, "epoch": 31.0, "percentage": 31.0, "elapsed_time": "0:11:37", "remaining_time": "0:25:52"} | |
| {"current_steps": 125, "total_steps": 400, "loss": 0.3322, "lr": 8.71572412738697e-07, "epoch": 31.29090909090909, "percentage": 31.25, "elapsed_time": "0:11:44", "remaining_time": "0:25:49"} | |
| {"current_steps": 126, "total_steps": 400, "loss": 0.3678, "lr": 8.68638668405062e-07, "epoch": 31.581818181818182, "percentage": 31.5, "elapsed_time": "0:11:50", "remaining_time": "0:25:45"} | |
| {"current_steps": 127, "total_steps": 400, "loss": 0.3699, "lr": 8.656768508095852e-07, "epoch": 31.87272727272727, "percentage": 31.75, "elapsed_time": "0:11:57", "remaining_time": "0:25:42"} | |
| {"current_steps": 128, "total_steps": 400, "loss": 0.2941, "lr": 8.626871855061437e-07, "epoch": 32.0, "percentage": 32.0, "elapsed_time": "0:12:00", "remaining_time": "0:25:30"} | |
| {"current_steps": 129, "total_steps": 400, "loss": 0.3305, "lr": 8.596699001693255e-07, "epoch": 32.29090909090909, "percentage": 32.25, "elapsed_time": "0:12:06", "remaining_time": "0:25:26"} | |
| {"current_steps": 130, "total_steps": 400, "loss": 0.3296, "lr": 8.566252245770907e-07, "epoch": 32.58181818181818, "percentage": 32.5, "elapsed_time": "0:12:13", "remaining_time": "0:25:23"} | |
| {"current_steps": 131, "total_steps": 400, "loss": 0.3332, "lr": 8.535533905932737e-07, "epoch": 32.872727272727275, "percentage": 32.75, "elapsed_time": "0:12:19", "remaining_time": "0:25:18"} | |
| {"current_steps": 132, "total_steps": 400, "loss": 0.3683, "lr": 8.504546321499254e-07, "epoch": 33.0, "percentage": 33.0, "elapsed_time": "0:12:22", "remaining_time": "0:25:07"} | |
| {"current_steps": 133, "total_steps": 400, "loss": 0.3776, "lr": 8.473291852294986e-07, "epoch": 33.29090909090909, "percentage": 33.25, "elapsed_time": "0:12:29", "remaining_time": "0:25:05"} | |
| {"current_steps": 134, "total_steps": 400, "loss": 0.3213, "lr": 8.441772878468769e-07, "epoch": 33.58181818181818, "percentage": 33.5, "elapsed_time": "0:12:36", "remaining_time": "0:25:01"} | |
| {"current_steps": 135, "total_steps": 400, "loss": 0.2998, "lr": 8.409991800312492e-07, "epoch": 33.872727272727275, "percentage": 33.75, "elapsed_time": "0:12:42", "remaining_time": "0:24:56"} | |
| {"current_steps": 136, "total_steps": 400, "loss": 0.2756, "lr": 8.377951038078301e-07, "epoch": 34.0, "percentage": 34.0, "elapsed_time": "0:12:45", "remaining_time": "0:24:45"} | |
| {"current_steps": 137, "total_steps": 400, "loss": 0.3056, "lr": 8.34565303179429e-07, "epoch": 34.29090909090909, "percentage": 34.25, "elapsed_time": "0:12:51", "remaining_time": "0:24:41"} | |
| {"current_steps": 138, "total_steps": 400, "loss": 0.3238, "lr": 8.313100241078687e-07, "epoch": 34.58181818181818, "percentage": 34.5, "elapsed_time": "0:12:58", "remaining_time": "0:24:37"} | |
| {"current_steps": 139, "total_steps": 400, "loss": 0.3317, "lr": 8.280295144952536e-07, "epoch": 34.872727272727275, "percentage": 34.75, "elapsed_time": "0:13:04", "remaining_time": "0:24:33"} | |
| {"current_steps": 140, "total_steps": 400, "loss": 0.2969, "lr": 8.247240241650917e-07, "epoch": 35.0, "percentage": 35.0, "elapsed_time": "0:13:07", "remaining_time": "0:24:22"} | |
| {"current_steps": 141, "total_steps": 400, "loss": 0.2916, "lr": 8.213938048432696e-07, "epoch": 35.29090909090909, "percentage": 35.25, "elapsed_time": "0:13:14", "remaining_time": "0:24:19"} | |
| {"current_steps": 142, "total_steps": 400, "loss": 0.3357, "lr": 8.180391101388819e-07, "epoch": 35.58181818181818, "percentage": 35.5, "elapsed_time": "0:13:21", "remaining_time": "0:24:15"} | |
| {"current_steps": 143, "total_steps": 400, "loss": 0.2653, "lr": 8.146601955249187e-07, "epoch": 35.872727272727275, "percentage": 35.75, "elapsed_time": "0:13:27", "remaining_time": "0:24:10"} | |
| {"current_steps": 144, "total_steps": 400, "loss": 0.3746, "lr": 8.112573183188098e-07, "epoch": 36.0, "percentage": 36.0, "elapsed_time": "0:13:29", "remaining_time": "0:23:59"} | |
| {"current_steps": 145, "total_steps": 400, "loss": 0.3263, "lr": 8.07830737662829e-07, "epoch": 36.29090909090909, "percentage": 36.25, "elapsed_time": "0:13:36", "remaining_time": "0:23:55"} | |
| {"current_steps": 146, "total_steps": 400, "loss": 0.272, "lr": 8.043807145043603e-07, "epoch": 36.58181818181818, "percentage": 36.5, "elapsed_time": "0:13:43", "remaining_time": "0:23:52"} | |
| {"current_steps": 147, "total_steps": 400, "loss": 0.3184, "lr": 8.009075115760242e-07, "epoch": 36.872727272727275, "percentage": 36.75, "elapsed_time": "0:13:49", "remaining_time": "0:23:48"} | |
| {"current_steps": 148, "total_steps": 400, "loss": 0.255, "lr": 7.974113933756707e-07, "epoch": 37.0, "percentage": 37.0, "elapsed_time": "0:13:52", "remaining_time": "0:23:37"} | |
| {"current_steps": 149, "total_steps": 400, "loss": 0.2887, "lr": 7.938926261462365e-07, "epoch": 37.29090909090909, "percentage": 37.25, "elapsed_time": "0:13:59", "remaining_time": "0:23:33"} | |
| {"current_steps": 150, "total_steps": 400, "loss": 0.2879, "lr": 7.903514778554699e-07, "epoch": 37.58181818181818, "percentage": 37.5, "elapsed_time": "0:14:05", "remaining_time": "0:23:28"} | |
| {"current_steps": 151, "total_steps": 400, "loss": 0.288, "lr": 7.86788218175523e-07, "epoch": 37.872727272727275, "percentage": 37.75, "elapsed_time": "0:14:12", "remaining_time": "0:23:25"} | |
| {"current_steps": 152, "total_steps": 400, "loss": 0.3232, "lr": 7.832031184624164e-07, "epoch": 38.0, "percentage": 38.0, "elapsed_time": "0:14:14", "remaining_time": "0:23:14"} | |
| {"current_steps": 153, "total_steps": 400, "loss": 0.2611, "lr": 7.795964517353733e-07, "epoch": 38.29090909090909, "percentage": 38.25, "elapsed_time": "0:14:21", "remaining_time": "0:23:10"} | |
| {"current_steps": 154, "total_steps": 400, "loss": 0.2767, "lr": 7.75968492656029e-07, "epoch": 38.58181818181818, "percentage": 38.5, "elapsed_time": "0:14:27", "remaining_time": "0:23:06"} | |
| {"current_steps": 155, "total_steps": 400, "loss": 0.3047, "lr": 7.723195175075135e-07, "epoch": 38.872727272727275, "percentage": 38.75, "elapsed_time": "0:14:34", "remaining_time": "0:23:02"} | |
| {"current_steps": 156, "total_steps": 400, "loss": 0.2922, "lr": 7.68649804173412e-07, "epoch": 39.0, "percentage": 39.0, "elapsed_time": "0:14:37", "remaining_time": "0:22:52"} | |
| {"current_steps": 157, "total_steps": 400, "loss": 0.2588, "lr": 7.649596321166024e-07, "epoch": 39.29090909090909, "percentage": 39.25, "elapsed_time": "0:14:43", "remaining_time": "0:22:47"} | |
| {"current_steps": 158, "total_steps": 400, "loss": 0.2772, "lr": 7.612492823579744e-07, "epoch": 39.58181818181818, "percentage": 39.5, "elapsed_time": "0:14:50", "remaining_time": "0:22:43"} | |
| {"current_steps": 159, "total_steps": 400, "loss": 0.289, "lr": 7.575190374550271e-07, "epoch": 39.872727272727275, "percentage": 39.75, "elapsed_time": "0:14:56", "remaining_time": "0:22:39"} | |
| {"current_steps": 160, "total_steps": 400, "loss": 0.2756, "lr": 7.537691814803521e-07, "epoch": 40.0, "percentage": 40.0, "elapsed_time": "0:14:59", "remaining_time": "0:22:29"} | |
| {"current_steps": 161, "total_steps": 400, "loss": 0.2694, "lr": 7.5e-07, "epoch": 40.29090909090909, "percentage": 40.25, "elapsed_time": "0:15:06", "remaining_time": "0:22:25"} | |
| {"current_steps": 162, "total_steps": 400, "loss": 0.2919, "lr": 7.462117800517336e-07, "epoch": 40.58181818181818, "percentage": 40.5, "elapsed_time": "0:15:12", "remaining_time": "0:22:20"} | |
| {"current_steps": 163, "total_steps": 400, "loss": 0.2595, "lr": 7.424048101231686e-07, "epoch": 40.872727272727275, "percentage": 40.75, "elapsed_time": "0:15:18", "remaining_time": "0:22:15"} | |
| {"current_steps": 164, "total_steps": 400, "loss": 0.2377, "lr": 7.385793801298042e-07, "epoch": 41.0, "percentage": 41.0, "elapsed_time": "0:15:22", "remaining_time": "0:22:06"} | |
| {"current_steps": 165, "total_steps": 400, "loss": 0.2574, "lr": 7.347357813929454e-07, "epoch": 41.29090909090909, "percentage": 41.25, "elapsed_time": "0:15:28", "remaining_time": "0:22:02"} | |
| {"current_steps": 166, "total_steps": 400, "loss": 0.2651, "lr": 7.30874306617517e-07, "epoch": 41.58181818181818, "percentage": 41.5, "elapsed_time": "0:15:35", "remaining_time": "0:21:58"} | |
| {"current_steps": 167, "total_steps": 400, "loss": 0.2475, "lr": 7.269952498697734e-07, "epoch": 41.872727272727275, "percentage": 41.75, "elapsed_time": "0:15:41", "remaining_time": "0:21:53"} | |
| {"current_steps": 168, "total_steps": 400, "loss": 0.3012, "lr": 7.230989065549044e-07, "epoch": 42.0, "percentage": 42.0, "elapsed_time": "0:15:44", "remaining_time": "0:21:44"} | |
| {"current_steps": 169, "total_steps": 400, "loss": 0.2441, "lr": 7.191855733945386e-07, "epoch": 42.29090909090909, "percentage": 42.25, "elapsed_time": "0:15:51", "remaining_time": "0:21:40"} | |
| {"current_steps": 170, "total_steps": 400, "loss": 0.282, "lr": 7.152555484041475e-07, "epoch": 42.58181818181818, "percentage": 42.5, "elapsed_time": "0:15:57", "remaining_time": "0:21:36"} | |
| {"current_steps": 171, "total_steps": 400, "loss": 0.2546, "lr": 7.113091308703497e-07, "epoch": 42.872727272727275, "percentage": 42.75, "elapsed_time": "0:16:04", "remaining_time": "0:21:31"} | |
| {"current_steps": 172, "total_steps": 400, "loss": 0.2248, "lr": 7.073466213281195e-07, "epoch": 43.0, "percentage": 43.0, "elapsed_time": "0:16:07", "remaining_time": "0:21:21"} | |
| {"current_steps": 173, "total_steps": 400, "loss": 0.2587, "lr": 7.033683215379002e-07, "epoch": 43.29090909090909, "percentage": 43.25, "elapsed_time": "0:16:13", "remaining_time": "0:21:17"} | |
| {"current_steps": 174, "total_steps": 400, "loss": 0.2566, "lr": 6.993745344626231e-07, "epoch": 43.58181818181818, "percentage": 43.5, "elapsed_time": "0:16:20", "remaining_time": "0:21:13"} | |
| {"current_steps": 175, "total_steps": 400, "loss": 0.2104, "lr": 6.953655642446367e-07, "epoch": 43.872727272727275, "percentage": 43.75, "elapsed_time": "0:16:26", "remaining_time": "0:21:08"} | |
| {"current_steps": 176, "total_steps": 400, "loss": 0.2926, "lr": 6.913417161825449e-07, "epoch": 44.0, "percentage": 44.0, "elapsed_time": "0:16:29", "remaining_time": "0:20:59"} | |
| {"current_steps": 177, "total_steps": 400, "loss": 0.2293, "lr": 6.87303296707956e-07, "epoch": 44.29090909090909, "percentage": 44.25, "elapsed_time": "0:16:36", "remaining_time": "0:20:55"} | |
| {"current_steps": 178, "total_steps": 400, "loss": 0.2878, "lr": 6.832506133621486e-07, "epoch": 44.58181818181818, "percentage": 44.5, "elapsed_time": "0:16:43", "remaining_time": "0:20:51"} | |
| {"current_steps": 179, "total_steps": 400, "loss": 0.208, "lr": 6.7918397477265e-07, "epoch": 44.872727272727275, "percentage": 44.75, "elapsed_time": "0:16:49", "remaining_time": "0:20:46"} | |
| {"current_steps": 180, "total_steps": 400, "loss": 0.2434, "lr": 6.751036906297337e-07, "epoch": 45.0, "percentage": 45.0, "elapsed_time": "0:16:52", "remaining_time": "0:20:37"} | |
| {"current_steps": 181, "total_steps": 400, "loss": 0.2202, "lr": 6.710100716628344e-07, "epoch": 45.29090909090909, "percentage": 45.25, "elapsed_time": "0:16:58", "remaining_time": "0:20:32"} | |
| {"current_steps": 182, "total_steps": 400, "loss": 0.2474, "lr": 6.669034296168854e-07, "epoch": 45.58181818181818, "percentage": 45.5, "elapsed_time": "0:17:05", "remaining_time": "0:20:28"} | |
| {"current_steps": 183, "total_steps": 400, "loss": 0.2362, "lr": 6.627840772285783e-07, "epoch": 45.872727272727275, "percentage": 45.75, "elapsed_time": "0:17:12", "remaining_time": "0:20:23"} | |
| {"current_steps": 184, "total_steps": 400, "loss": 0.2169, "lr": 6.586523282025461e-07, "epoch": 46.0, "percentage": 46.0, "elapsed_time": "0:17:14", "remaining_time": "0:20:14"} | |
| {"current_steps": 185, "total_steps": 400, "loss": 0.2167, "lr": 6.545084971874736e-07, "epoch": 46.29090909090909, "percentage": 46.25, "elapsed_time": "0:17:21", "remaining_time": "0:20:10"} | |
| {"current_steps": 186, "total_steps": 400, "loss": 0.2181, "lr": 6.503528997521364e-07, "epoch": 46.58181818181818, "percentage": 46.5, "elapsed_time": "0:17:27", "remaining_time": "0:20:05"} | |
| {"current_steps": 187, "total_steps": 400, "loss": 0.2453, "lr": 6.461858523613684e-07, "epoch": 46.872727272727275, "percentage": 46.75, "elapsed_time": "0:17:34", "remaining_time": "0:20:01"} | |
| {"current_steps": 188, "total_steps": 400, "loss": 0.2183, "lr": 6.420076723519614e-07, "epoch": 47.0, "percentage": 47.0, "elapsed_time": "0:17:37", "remaining_time": "0:19:52"} | |
| {"current_steps": 189, "total_steps": 400, "loss": 0.2127, "lr": 6.378186779084995e-07, "epoch": 47.29090909090909, "percentage": 47.25, "elapsed_time": "0:17:43", "remaining_time": "0:19:47"} | |
| {"current_steps": 190, "total_steps": 400, "loss": 0.2061, "lr": 6.336191880391284e-07, "epoch": 47.58181818181818, "percentage": 47.5, "elapsed_time": "0:17:50", "remaining_time": "0:19:42"} | |
| {"current_steps": 191, "total_steps": 400, "loss": 0.2497, "lr": 6.294095225512604e-07, "epoch": 47.872727272727275, "percentage": 47.75, "elapsed_time": "0:17:56", "remaining_time": "0:19:38"} | |
| {"current_steps": 192, "total_steps": 400, "loss": 0.1899, "lr": 6.251900020272207e-07, "epoch": 48.0, "percentage": 48.0, "elapsed_time": "0:17:59", "remaining_time": "0:19:29"} | |
| {"current_steps": 193, "total_steps": 400, "loss": 0.2159, "lr": 6.209609477998338e-07, "epoch": 48.29090909090909, "percentage": 48.25, "elapsed_time": "0:18:06", "remaining_time": "0:19:24"} | |
| {"current_steps": 194, "total_steps": 400, "loss": 0.2476, "lr": 6.167226819279527e-07, "epoch": 48.58181818181818, "percentage": 48.5, "elapsed_time": "0:18:12", "remaining_time": "0:19:20"} | |
| {"current_steps": 195, "total_steps": 400, "loss": 0.1801, "lr": 6.124755271719326e-07, "epoch": 48.872727272727275, "percentage": 48.75, "elapsed_time": "0:18:19", "remaining_time": "0:19:15"} | |
| {"current_steps": 196, "total_steps": 400, "loss": 0.1941, "lr": 6.082198069690514e-07, "epoch": 49.0, "percentage": 49.0, "elapsed_time": "0:18:22", "remaining_time": "0:19:07"} | |
| {"current_steps": 197, "total_steps": 400, "loss": 0.207, "lr": 6.039558454088795e-07, "epoch": 49.29090909090909, "percentage": 49.25, "elapsed_time": "0:18:28", "remaining_time": "0:19:02"} | |
| {"current_steps": 198, "total_steps": 400, "loss": 0.17, "lr": 5.996839672085986e-07, "epoch": 49.58181818181818, "percentage": 49.5, "elapsed_time": "0:18:34", "remaining_time": "0:18:57"} | |
| {"current_steps": 199, "total_steps": 400, "loss": 0.2268, "lr": 5.954044976882723e-07, "epoch": 49.872727272727275, "percentage": 49.75, "elapsed_time": "0:18:41", "remaining_time": "0:18:53"} | |
| {"current_steps": 200, "total_steps": 400, "loss": 0.2013, "lr": 5.911177627460738e-07, "epoch": 50.0, "percentage": 50.0, "elapsed_time": "0:18:44", "remaining_time": "0:18:44"} | |
| {"current_steps": 200, "total_steps": 400, "eval_loss": 0.6481181383132935, "epoch": 50.0, "percentage": 50.0, "elapsed_time": "0:18:45", "remaining_time": "0:18:45"} | |
| {"current_steps": 201, "total_steps": 400, "loss": 0.2331, "lr": 5.868240888334652e-07, "epoch": 50.29090909090909, "percentage": 50.25, "elapsed_time": "0:19:12", "remaining_time": "0:19:01"} | |
| {"current_steps": 202, "total_steps": 400, "loss": 0.1794, "lr": 5.825238029303387e-07, "epoch": 50.58181818181818, "percentage": 50.5, "elapsed_time": "0:19:19", "remaining_time": "0:18:56"} | |
| {"current_steps": 203, "total_steps": 400, "loss": 0.1981, "lr": 5.782172325201155e-07, "epoch": 50.872727272727275, "percentage": 50.75, "elapsed_time": "0:19:25", "remaining_time": "0:18:51"} | |
| {"current_steps": 204, "total_steps": 400, "loss": 0.1279, "lr": 5.739047055648054e-07, "epoch": 51.0, "percentage": 51.0, "elapsed_time": "0:19:28", "remaining_time": "0:18:42"} | |
| {"current_steps": 205, "total_steps": 400, "loss": 0.218, "lr": 5.695865504800327e-07, "epoch": 51.29090909090909, "percentage": 51.25, "elapsed_time": "0:19:35", "remaining_time": "0:18:38"} | |
| {"current_steps": 206, "total_steps": 400, "loss": 0.1534, "lr": 5.652630961100258e-07, "epoch": 51.58181818181818, "percentage": 51.5, "elapsed_time": "0:19:41", "remaining_time": "0:18:32"} | |
| {"current_steps": 207, "total_steps": 400, "loss": 0.1948, "lr": 5.609346717025737e-07, "epoch": 51.872727272727275, "percentage": 51.75, "elapsed_time": "0:19:48", "remaining_time": "0:18:28"} | |
| {"current_steps": 208, "total_steps": 400, "loss": 0.1769, "lr": 5.566016068839534e-07, "epoch": 52.0, "percentage": 52.0, "elapsed_time": "0:19:51", "remaining_time": "0:18:19"} | |
| {"current_steps": 209, "total_steps": 400, "loss": 0.1619, "lr": 5.522642316338268e-07, "epoch": 52.29090909090909, "percentage": 52.25, "elapsed_time": "0:19:58", "remaining_time": "0:18:14"} | |
| {"current_steps": 210, "total_steps": 400, "loss": 0.2259, "lr": 5.47922876260112e-07, "epoch": 52.58181818181818, "percentage": 52.5, "elapsed_time": "0:20:04", "remaining_time": "0:18:10"} | |
| {"current_steps": 211, "total_steps": 400, "loss": 0.164, "lr": 5.435778713738292e-07, "epoch": 52.872727272727275, "percentage": 52.75, "elapsed_time": "0:20:11", "remaining_time": "0:18:05"} | |
| {"current_steps": 212, "total_steps": 400, "loss": 0.1561, "lr": 5.392295478639225e-07, "epoch": 53.0, "percentage": 53.0, "elapsed_time": "0:20:14", "remaining_time": "0:17:56"} | |
| {"current_steps": 213, "total_steps": 400, "loss": 0.1655, "lr": 5.348782368720625e-07, "epoch": 53.29090909090909, "percentage": 53.25, "elapsed_time": "0:20:20", "remaining_time": "0:17:51"} | |
| {"current_steps": 214, "total_steps": 400, "loss": 0.1606, "lr": 5.305242697674285e-07, "epoch": 53.58181818181818, "percentage": 53.5, "elapsed_time": "0:20:27", "remaining_time": "0:17:47"} | |
| {"current_steps": 215, "total_steps": 400, "loss": 0.1846, "lr": 5.26167978121472e-07, "epoch": 53.872727272727275, "percentage": 53.75, "elapsed_time": "0:20:33", "remaining_time": "0:17:41"} | |
| {"current_steps": 216, "total_steps": 400, "loss": 0.2143, "lr": 5.21809693682668e-07, "epoch": 54.0, "percentage": 54.0, "elapsed_time": "0:20:36", "remaining_time": "0:17:33"} | |
| {"current_steps": 217, "total_steps": 400, "loss": 0.1547, "lr": 5.174497483512505e-07, "epoch": 54.29090909090909, "percentage": 54.25, "elapsed_time": "0:20:43", "remaining_time": "0:17:28"} | |
| {"current_steps": 218, "total_steps": 400, "loss": 0.1874, "lr": 5.130884741539366e-07, "epoch": 54.58181818181818, "percentage": 54.5, "elapsed_time": "0:20:50", "remaining_time": "0:17:23"} | |
| {"current_steps": 219, "total_steps": 400, "loss": 0.165, "lr": 5.087262032186418e-07, "epoch": 54.872727272727275, "percentage": 54.75, "elapsed_time": "0:20:56", "remaining_time": "0:17:18"} | |
| {"current_steps": 220, "total_steps": 400, "loss": 0.1532, "lr": 5.043632677491869e-07, "epoch": 55.0, "percentage": 55.0, "elapsed_time": "0:20:59", "remaining_time": "0:17:10"} | |
| {"current_steps": 221, "total_steps": 400, "loss": 0.1514, "lr": 5e-07, "epoch": 55.29090909090909, "percentage": 55.25, "elapsed_time": "0:21:05", "remaining_time": "0:17:05"} | |
| {"current_steps": 222, "total_steps": 400, "loss": 0.1477, "lr": 4.956367322508131e-07, "epoch": 55.58181818181818, "percentage": 55.5, "elapsed_time": "0:21:12", "remaining_time": "0:17:00"} | |
| {"current_steps": 223, "total_steps": 400, "loss": 0.1733, "lr": 4.912737967813582e-07, "epoch": 55.872727272727275, "percentage": 55.75, "elapsed_time": "0:21:19", "remaining_time": "0:16:55"} | |
| {"current_steps": 224, "total_steps": 400, "loss": 0.171, "lr": 4.869115258460634e-07, "epoch": 56.0, "percentage": 56.0, "elapsed_time": "0:21:22", "remaining_time": "0:16:47"} | |
| {"current_steps": 225, "total_steps": 400, "loss": 0.1914, "lr": 4.825502516487496e-07, "epoch": 56.29090909090909, "percentage": 56.25, "elapsed_time": "0:21:28", "remaining_time": "0:16:42"} | |
| {"current_steps": 226, "total_steps": 400, "loss": 0.1517, "lr": 4.78190306317332e-07, "epoch": 56.58181818181818, "percentage": 56.5, "elapsed_time": "0:21:35", "remaining_time": "0:16:37"} | |
| {"current_steps": 227, "total_steps": 400, "loss": 0.1187, "lr": 4.7383202187852804e-07, "epoch": 56.872727272727275, "percentage": 56.75, "elapsed_time": "0:21:41", "remaining_time": "0:16:32"} | |
| {"current_steps": 228, "total_steps": 400, "loss": 0.1476, "lr": 4.694757302325715e-07, "epoch": 57.0, "percentage": 57.0, "elapsed_time": "0:21:44", "remaining_time": "0:16:24"} | |
| {"current_steps": 229, "total_steps": 400, "loss": 0.1686, "lr": 4.6512176312793735e-07, "epoch": 57.29090909090909, "percentage": 57.25, "elapsed_time": "0:21:50", "remaining_time": "0:16:18"} | |
| {"current_steps": 230, "total_steps": 400, "loss": 0.1176, "lr": 4.6077045213607755e-07, "epoch": 57.58181818181818, "percentage": 57.5, "elapsed_time": "0:21:57", "remaining_time": "0:16:13"} | |
| {"current_steps": 231, "total_steps": 400, "loss": 0.1597, "lr": 4.5642212862617085e-07, "epoch": 57.872727272727275, "percentage": 57.75, "elapsed_time": "0:22:03", "remaining_time": "0:16:08"} | |
| {"current_steps": 232, "total_steps": 400, "loss": 0.1334, "lr": 4.52077123739888e-07, "epoch": 58.0, "percentage": 58.0, "elapsed_time": "0:22:06", "remaining_time": "0:16:00"} | |
| {"current_steps": 233, "total_steps": 400, "loss": 0.1215, "lr": 4.477357683661733e-07, "epoch": 58.29090909090909, "percentage": 58.25, "elapsed_time": "0:22:13", "remaining_time": "0:15:55"} | |
| {"current_steps": 234, "total_steps": 400, "loss": 0.1905, "lr": 4.4339839311604664e-07, "epoch": 58.58181818181818, "percentage": 58.5, "elapsed_time": "0:22:19", "remaining_time": "0:15:50"} | |
| {"current_steps": 235, "total_steps": 400, "loss": 0.1169, "lr": 4.390653282974263e-07, "epoch": 58.872727272727275, "percentage": 58.75, "elapsed_time": "0:22:26", "remaining_time": "0:15:45"} | |
| {"current_steps": 236, "total_steps": 400, "loss": 0.1068, "lr": 4.347369038899743e-07, "epoch": 59.0, "percentage": 59.0, "elapsed_time": "0:22:28", "remaining_time": "0:15:37"} | |
| {"current_steps": 237, "total_steps": 400, "loss": 0.115, "lr": 4.304134495199674e-07, "epoch": 59.29090909090909, "percentage": 59.25, "elapsed_time": "0:22:35", "remaining_time": "0:15:32"} | |
| {"current_steps": 238, "total_steps": 400, "loss": 0.1589, "lr": 4.2609529443519464e-07, "epoch": 59.58181818181818, "percentage": 59.5, "elapsed_time": "0:22:42", "remaining_time": "0:15:27"} | |
| {"current_steps": 239, "total_steps": 400, "loss": 0.1123, "lr": 4.2178276747988444e-07, "epoch": 59.872727272727275, "percentage": 59.75, "elapsed_time": "0:22:48", "remaining_time": "0:15:21"} | |
| {"current_steps": 240, "total_steps": 400, "loss": 0.1374, "lr": 4.1747619706966113e-07, "epoch": 60.0, "percentage": 60.0, "elapsed_time": "0:22:51", "remaining_time": "0:15:14"} | |
| {"current_steps": 241, "total_steps": 400, "loss": 0.1534, "lr": 4.131759111665348e-07, "epoch": 60.29090909090909, "percentage": 60.25, "elapsed_time": "0:22:57", "remaining_time": "0:15:08"} | |
| {"current_steps": 242, "total_steps": 400, "loss": 0.1082, "lr": 4.0888223725392624e-07, "epoch": 60.58181818181818, "percentage": 60.5, "elapsed_time": "0:23:04", "remaining_time": "0:15:03"} | |
| {"current_steps": 243, "total_steps": 400, "loss": 0.1336, "lr": 4.0459550231172755e-07, "epoch": 60.872727272727275, "percentage": 60.75, "elapsed_time": "0:23:10", "remaining_time": "0:14:58"} | |
| {"current_steps": 244, "total_steps": 400, "loss": 0.1139, "lr": 4.0031603279140144e-07, "epoch": 61.0, "percentage": 61.0, "elapsed_time": "0:23:13", "remaining_time": "0:14:50"} | |
| {"current_steps": 245, "total_steps": 400, "loss": 0.1019, "lr": 3.960441545911204e-07, "epoch": 61.29090909090909, "percentage": 61.25, "elapsed_time": "0:23:19", "remaining_time": "0:14:45"} | |
| {"current_steps": 246, "total_steps": 400, "loss": 0.109, "lr": 3.9178019303094856e-07, "epoch": 61.58181818181818, "percentage": 61.5, "elapsed_time": "0:23:26", "remaining_time": "0:14:40"} | |
| {"current_steps": 247, "total_steps": 400, "loss": 0.136, "lr": 3.8752447282806755e-07, "epoch": 61.872727272727275, "percentage": 61.75, "elapsed_time": "0:23:32", "remaining_time": "0:14:35"} | |
| {"current_steps": 248, "total_steps": 400, "loss": 0.1639, "lr": 3.8327731807204744e-07, "epoch": 62.0, "percentage": 62.0, "elapsed_time": "0:23:35", "remaining_time": "0:14:27"} | |
| {"current_steps": 249, "total_steps": 400, "loss": 0.1323, "lr": 3.790390522001662e-07, "epoch": 62.29090909090909, "percentage": 62.25, "elapsed_time": "0:23:42", "remaining_time": "0:14:22"} | |
| {"current_steps": 250, "total_steps": 400, "loss": 0.0865, "lr": 3.7480999797277917e-07, "epoch": 62.58181818181818, "percentage": 62.5, "elapsed_time": "0:23:48", "remaining_time": "0:14:17"} | |
| {"current_steps": 251, "total_steps": 400, "loss": 0.1178, "lr": 3.7059047744873955e-07, "epoch": 62.872727272727275, "percentage": 62.75, "elapsed_time": "0:23:54", "remaining_time": "0:14:11"} | |
| {"current_steps": 252, "total_steps": 400, "loss": 0.1375, "lr": 3.6638081196087153e-07, "epoch": 63.0, "percentage": 63.0, "elapsed_time": "0:23:57", "remaining_time": "0:14:04"} | |
| {"current_steps": 253, "total_steps": 400, "loss": 0.1008, "lr": 3.621813220915004e-07, "epoch": 63.29090909090909, "percentage": 63.25, "elapsed_time": "0:24:04", "remaining_time": "0:13:59"} | |
| {"current_steps": 254, "total_steps": 400, "loss": 0.1087, "lr": 3.5799232764803867e-07, "epoch": 63.58181818181818, "percentage": 63.5, "elapsed_time": "0:24:10", "remaining_time": "0:13:53"} | |
| {"current_steps": 255, "total_steps": 400, "loss": 0.1261, "lr": 3.5381414763863163e-07, "epoch": 63.872727272727275, "percentage": 63.75, "elapsed_time": "0:24:17", "remaining_time": "0:13:48"} | |
| {"current_steps": 256, "total_steps": 400, "loss": 0.1318, "lr": 3.4964710024786347e-07, "epoch": 64.0, "percentage": 64.0, "elapsed_time": "0:24:19", "remaining_time": "0:13:41"} | |
| {"current_steps": 257, "total_steps": 400, "loss": 0.091, "lr": 3.454915028125263e-07, "epoch": 64.2909090909091, "percentage": 64.25, "elapsed_time": "0:24:26", "remaining_time": "0:13:36"} | |
| {"current_steps": 258, "total_steps": 400, "loss": 0.0987, "lr": 3.41347671797454e-07, "epoch": 64.58181818181818, "percentage": 64.5, "elapsed_time": "0:24:33", "remaining_time": "0:13:30"} | |
| {"current_steps": 259, "total_steps": 400, "loss": 0.1111, "lr": 3.3721592277142173e-07, "epoch": 64.87272727272727, "percentage": 64.75, "elapsed_time": "0:24:39", "remaining_time": "0:13:25"} | |
| {"current_steps": 260, "total_steps": 400, "loss": 0.1852, "lr": 3.330965703831146e-07, "epoch": 65.0, "percentage": 65.0, "elapsed_time": "0:24:42", "remaining_time": "0:13:18"} | |
| {"current_steps": 261, "total_steps": 400, "loss": 0.1025, "lr": 3.2898992833716563e-07, "epoch": 65.2909090909091, "percentage": 65.25, "elapsed_time": "0:24:48", "remaining_time": "0:13:12"} | |
| {"current_steps": 262, "total_steps": 400, "loss": 0.1093, "lr": 3.248963093702662e-07, "epoch": 65.58181818181818, "percentage": 65.5, "elapsed_time": "0:24:54", "remaining_time": "0:13:07"} | |
| {"current_steps": 263, "total_steps": 400, "loss": 0.1124, "lr": 3.2081602522734985e-07, "epoch": 65.87272727272727, "percentage": 65.75, "elapsed_time": "0:25:01", "remaining_time": "0:13:02"} | |
| {"current_steps": 264, "total_steps": 400, "loss": 0.0882, "lr": 3.167493866378514e-07, "epoch": 66.0, "percentage": 66.0, "elapsed_time": "0:25:04", "remaining_time": "0:12:54"} | |
| {"current_steps": 265, "total_steps": 400, "loss": 0.1196, "lr": 3.1269670329204393e-07, "epoch": 66.2909090909091, "percentage": 66.25, "elapsed_time": "0:25:10", "remaining_time": "0:12:49"} | |
| {"current_steps": 266, "total_steps": 400, "loss": 0.0893, "lr": 3.086582838174551e-07, "epoch": 66.58181818181818, "percentage": 66.5, "elapsed_time": "0:25:17", "remaining_time": "0:12:44"} | |
| {"current_steps": 267, "total_steps": 400, "loss": 0.1058, "lr": 3.0463443575536317e-07, "epoch": 66.87272727272727, "percentage": 66.75, "elapsed_time": "0:25:23", "remaining_time": "0:12:38"} | |
| {"current_steps": 268, "total_steps": 400, "loss": 0.0891, "lr": 3.006254655373769e-07, "epoch": 67.0, "percentage": 67.0, "elapsed_time": "0:25:26", "remaining_time": "0:12:31"} | |
| {"current_steps": 269, "total_steps": 400, "loss": 0.0957, "lr": 2.9663167846209996e-07, "epoch": 67.2909090909091, "percentage": 67.25, "elapsed_time": "0:25:32", "remaining_time": "0:12:26"} | |
| {"current_steps": 270, "total_steps": 400, "loss": 0.0807, "lr": 2.9265337867188055e-07, "epoch": 67.58181818181818, "percentage": 67.5, "elapsed_time": "0:25:38", "remaining_time": "0:12:20"} | |
| {"current_steps": 271, "total_steps": 400, "loss": 0.0932, "lr": 2.8869086912965036e-07, "epoch": 67.87272727272727, "percentage": 67.75, "elapsed_time": "0:25:45", "remaining_time": "0:12:15"} | |
| {"current_steps": 272, "total_steps": 400, "loss": 0.1499, "lr": 2.847444515958523e-07, "epoch": 68.0, "percentage": 68.0, "elapsed_time": "0:25:48", "remaining_time": "0:12:08"} | |
| {"current_steps": 273, "total_steps": 400, "loss": 0.0786, "lr": 2.808144266054612e-07, "epoch": 68.2909090909091, "percentage": 68.25, "elapsed_time": "0:25:54", "remaining_time": "0:12:03"} | |
| {"current_steps": 274, "total_steps": 400, "loss": 0.0754, "lr": 2.769010934450956e-07, "epoch": 68.58181818181818, "percentage": 68.5, "elapsed_time": "0:26:01", "remaining_time": "0:11:57"} | |
| {"current_steps": 275, "total_steps": 400, "loss": 0.1224, "lr": 2.730047501302266e-07, "epoch": 68.87272727272727, "percentage": 68.75, "elapsed_time": "0:26:08", "remaining_time": "0:11:52"} | |
| {"current_steps": 276, "total_steps": 400, "loss": 0.1018, "lr": 2.6912569338248315e-07, "epoch": 69.0, "percentage": 69.0, "elapsed_time": "0:26:10", "remaining_time": "0:11:45"} | |
| {"current_steps": 277, "total_steps": 400, "loss": 0.1036, "lr": 2.6526421860705473e-07, "epoch": 69.2909090909091, "percentage": 69.25, "elapsed_time": "0:26:17", "remaining_time": "0:11:40"} | |
| {"current_steps": 278, "total_steps": 400, "loss": 0.0825, "lr": 2.6142061987019574e-07, "epoch": 69.58181818181818, "percentage": 69.5, "elapsed_time": "0:26:24", "remaining_time": "0:11:35"} | |
| {"current_steps": 279, "total_steps": 400, "loss": 0.0847, "lr": 2.575951898768315e-07, "epoch": 69.87272727272727, "percentage": 69.75, "elapsed_time": "0:26:30", "remaining_time": "0:11:29"} | |
| {"current_steps": 280, "total_steps": 400, "loss": 0.099, "lr": 2.537882199482665e-07, "epoch": 70.0, "percentage": 70.0, "elapsed_time": "0:26:32", "remaining_time": "0:11:22"} | |
| {"current_steps": 281, "total_steps": 400, "loss": 0.0913, "lr": 2.500000000000001e-07, "epoch": 70.2909090909091, "percentage": 70.25, "elapsed_time": "0:26:39", "remaining_time": "0:11:17"} | |
| {"current_steps": 282, "total_steps": 400, "loss": 0.1158, "lr": 2.4623081851964805e-07, "epoch": 70.58181818181818, "percentage": 70.5, "elapsed_time": "0:26:45", "remaining_time": "0:11:11"} | |
| {"current_steps": 283, "total_steps": 400, "loss": 0.0729, "lr": 2.424809625449729e-07, "epoch": 70.87272727272727, "percentage": 70.75, "elapsed_time": "0:26:52", "remaining_time": "0:11:06"} | |
| {"current_steps": 284, "total_steps": 400, "loss": 0.0634, "lr": 2.387507176420256e-07, "epoch": 71.0, "percentage": 71.0, "elapsed_time": "0:26:55", "remaining_time": "0:10:59"} | |
| {"current_steps": 285, "total_steps": 400, "loss": 0.0724, "lr": 2.350403678833976e-07, "epoch": 71.2909090909091, "percentage": 71.25, "elapsed_time": "0:27:01", "remaining_time": "0:10:54"} | |
| {"current_steps": 286, "total_steps": 400, "loss": 0.1118, "lr": 2.31350195826588e-07, "epoch": 71.58181818181818, "percentage": 71.5, "elapsed_time": "0:27:08", "remaining_time": "0:10:48"} | |
| {"current_steps": 287, "total_steps": 400, "loss": 0.0732, "lr": 2.2768048249248644e-07, "epoch": 71.87272727272727, "percentage": 71.75, "elapsed_time": "0:27:14", "remaining_time": "0:10:43"} | |
| {"current_steps": 288, "total_steps": 400, "loss": 0.0775, "lr": 2.240315073439709e-07, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:27:17", "remaining_time": "0:10:36"} | |
| {"current_steps": 289, "total_steps": 400, "loss": 0.0643, "lr": 2.2040354826462664e-07, "epoch": 72.2909090909091, "percentage": 72.25, "elapsed_time": "0:27:23", "remaining_time": "0:10:31"} | |
| {"current_steps": 290, "total_steps": 400, "loss": 0.0908, "lr": 2.167968815375837e-07, "epoch": 72.58181818181818, "percentage": 72.5, "elapsed_time": "0:27:30", "remaining_time": "0:10:25"} | |
| {"current_steps": 291, "total_steps": 400, "loss": 0.0744, "lr": 2.1321178182447709e-07, "epoch": 72.87272727272727, "percentage": 72.75, "elapsed_time": "0:27:36", "remaining_time": "0:10:20"} | |
| {"current_steps": 292, "total_steps": 400, "loss": 0.1409, "lr": 2.096485221445301e-07, "epoch": 73.0, "percentage": 73.0, "elapsed_time": "0:27:39", "remaining_time": "0:10:13"} | |
| {"current_steps": 293, "total_steps": 400, "loss": 0.0861, "lr": 2.0610737385376348e-07, "epoch": 73.2909090909091, "percentage": 73.25, "elapsed_time": "0:27:46", "remaining_time": "0:10:08"} | |
| {"current_steps": 294, "total_steps": 400, "loss": 0.0693, "lr": 2.0258860662432942e-07, "epoch": 73.58181818181818, "percentage": 73.5, "elapsed_time": "0:27:52", "remaining_time": "0:10:02"} | |
| {"current_steps": 295, "total_steps": 400, "loss": 0.0902, "lr": 1.990924884239758e-07, "epoch": 73.87272727272727, "percentage": 73.75, "elapsed_time": "0:27:58", "remaining_time": "0:09:57"} | |
| {"current_steps": 296, "total_steps": 400, "loss": 0.0767, "lr": 1.9561928549563966e-07, "epoch": 74.0, "percentage": 74.0, "elapsed_time": "0:28:01", "remaining_time": "0:09:50"} | |
| {"current_steps": 297, "total_steps": 400, "loss": 0.0735, "lr": 1.9216926233717084e-07, "epoch": 74.2909090909091, "percentage": 74.25, "elapsed_time": "0:28:07", "remaining_time": "0:09:45"} | |
| {"current_steps": 298, "total_steps": 400, "loss": 0.0623, "lr": 1.887426816811903e-07, "epoch": 74.58181818181818, "percentage": 74.5, "elapsed_time": "0:28:13", "remaining_time": "0:09:39"} | |
| {"current_steps": 299, "total_steps": 400, "loss": 0.0971, "lr": 1.8533980447508135e-07, "epoch": 74.87272727272727, "percentage": 74.75, "elapsed_time": "0:28:21", "remaining_time": "0:09:34"} | |
| {"current_steps": 300, "total_steps": 400, "loss": 0.0776, "lr": 1.8196088986111796e-07, "epoch": 75.0, "percentage": 75.0, "elapsed_time": "0:28:23", "remaining_time": "0:09:27"} | |
| {"current_steps": 300, "total_steps": 400, "eval_loss": 1.010074496269226, "epoch": 75.0, "percentage": 75.0, "elapsed_time": "0:28:24", "remaining_time": "0:09:28"} | |
| {"current_steps": 301, "total_steps": 400, "loss": 0.0716, "lr": 1.7860619515673032e-07, "epoch": 75.2909090909091, "percentage": 75.25, "elapsed_time": "0:28:30", "remaining_time": "0:09:22"} | |
| {"current_steps": 302, "total_steps": 400, "loss": 0.0949, "lr": 1.7527597583490823e-07, "epoch": 75.58181818181818, "percentage": 75.5, "elapsed_time": "0:28:37", "remaining_time": "0:09:17"} | |
| {"current_steps": 303, "total_steps": 400, "loss": 0.075, "lr": 1.7197048550474641e-07, "epoch": 75.87272727272727, "percentage": 75.75, "elapsed_time": "0:28:43", "remaining_time": "0:09:11"} | |
| {"current_steps": 304, "total_steps": 400, "loss": 0.0544, "lr": 1.6868997589213136e-07, "epoch": 76.0, "percentage": 76.0, "elapsed_time": "0:28:46", "remaining_time": "0:09:05"} | |
| {"current_steps": 305, "total_steps": 400, "loss": 0.066, "lr": 1.6543469682057104e-07, "epoch": 76.2909090909091, "percentage": 76.25, "elapsed_time": "0:28:53", "remaining_time": "0:08:59"} | |
| {"current_steps": 306, "total_steps": 400, "loss": 0.0569, "lr": 1.6220489619216987e-07, "epoch": 76.58181818181818, "percentage": 76.5, "elapsed_time": "0:28:59", "remaining_time": "0:08:54"} | |
| {"current_steps": 307, "total_steps": 400, "loss": 0.1133, "lr": 1.590008199687508e-07, "epoch": 76.87272727272727, "percentage": 76.75, "elapsed_time": "0:29:06", "remaining_time": "0:08:48"} | |
| {"current_steps": 308, "total_steps": 400, "loss": 0.0596, "lr": 1.5582271215312293e-07, "epoch": 77.0, "percentage": 77.0, "elapsed_time": "0:29:09", "remaining_time": "0:08:42"} | |
| {"current_steps": 309, "total_steps": 400, "loss": 0.102, "lr": 1.5267081477050131e-07, "epoch": 77.2909090909091, "percentage": 77.25, "elapsed_time": "0:29:15", "remaining_time": "0:08:37"} | |
| {"current_steps": 310, "total_steps": 400, "loss": 0.06, "lr": 1.4954536785007455e-07, "epoch": 77.58181818181818, "percentage": 77.5, "elapsed_time": "0:29:22", "remaining_time": "0:08:31"} | |
| {"current_steps": 311, "total_steps": 400, "loss": 0.0668, "lr": 1.4644660940672627e-07, "epoch": 77.87272727272727, "percentage": 77.75, "elapsed_time": "0:29:28", "remaining_time": "0:08:26"} | |
| {"current_steps": 312, "total_steps": 400, "loss": 0.0602, "lr": 1.4337477542290926e-07, "epoch": 78.0, "percentage": 78.0, "elapsed_time": "0:29:31", "remaining_time": "0:08:19"} | |
| {"current_steps": 313, "total_steps": 400, "loss": 0.0762, "lr": 1.4033009983067452e-07, "epoch": 78.2909090909091, "percentage": 78.25, "elapsed_time": "0:29:38", "remaining_time": "0:08:14"} | |
| {"current_steps": 314, "total_steps": 400, "loss": 0.0861, "lr": 1.3731281449385628e-07, "epoch": 78.58181818181818, "percentage": 78.5, "elapsed_time": "0:29:45", "remaining_time": "0:08:08"} | |
| {"current_steps": 315, "total_steps": 400, "loss": 0.0617, "lr": 1.3432314919041477e-07, "epoch": 78.87272727272727, "percentage": 78.75, "elapsed_time": "0:29:51", "remaining_time": "0:08:03"} | |
| {"current_steps": 316, "total_steps": 400, "loss": 0.0472, "lr": 1.31361331594938e-07, "epoch": 79.0, "percentage": 79.0, "elapsed_time": "0:29:53", "remaining_time": "0:07:56"} | |
| {"current_steps": 317, "total_steps": 400, "loss": 0.071, "lr": 1.284275872613028e-07, "epoch": 79.2909090909091, "percentage": 79.25, "elapsed_time": "0:30:00", "remaining_time": "0:07:51"} | |
| {"current_steps": 318, "total_steps": 400, "loss": 0.0579, "lr": 1.255221396054989e-07, "epoch": 79.58181818181818, "percentage": 79.5, "elapsed_time": "0:30:06", "remaining_time": "0:07:45"} | |
| {"current_steps": 319, "total_steps": 400, "loss": 0.0605, "lr": 1.22645209888614e-07, "epoch": 79.87272727272727, "percentage": 79.75, "elapsed_time": "0:30:12", "remaining_time": "0:07:40"} | |
| {"current_steps": 320, "total_steps": 400, "loss": 0.1215, "lr": 1.1979701719998454e-07, "epoch": 80.0, "percentage": 80.0, "elapsed_time": "0:30:15", "remaining_time": "0:07:33"} | |
| {"current_steps": 321, "total_steps": 400, "loss": 0.0599, "lr": 1.1697777844051104e-07, "epoch": 80.2909090909091, "percentage": 80.25, "elapsed_time": "0:30:21", "remaining_time": "0:07:28"} | |
| {"current_steps": 322, "total_steps": 400, "loss": 0.0683, "lr": 1.141877083061401e-07, "epoch": 80.58181818181818, "percentage": 80.5, "elapsed_time": "0:30:28", "remaining_time": "0:07:22"} | |
| {"current_steps": 323, "total_steps": 400, "loss": 0.0841, "lr": 1.1142701927151454e-07, "epoch": 80.87272727272727, "percentage": 80.75, "elapsed_time": "0:30:35", "remaining_time": "0:07:17"} | |
| {"current_steps": 324, "total_steps": 400, "loss": 0.0521, "lr": 1.0869592157379304e-07, "epoch": 81.0, "percentage": 81.0, "elapsed_time": "0:30:38", "remaining_time": "0:07:11"} | |
| {"current_steps": 325, "total_steps": 400, "loss": 0.0845, "lr": 1.0599462319663904e-07, "epoch": 81.2909090909091, "percentage": 81.25, "elapsed_time": "0:30:44", "remaining_time": "0:07:05"} | |
| {"current_steps": 326, "total_steps": 400, "loss": 0.0838, "lr": 1.0332332985438247e-07, "epoch": 81.58181818181818, "percentage": 81.5, "elapsed_time": "0:30:50", "remaining_time": "0:07:00"} | |
| {"current_steps": 327, "total_steps": 400, "loss": 0.0504, "lr": 1.0068224497635369e-07, "epoch": 81.87272727272727, "percentage": 81.75, "elapsed_time": "0:30:57", "remaining_time": "0:06:54"} | |
| {"current_steps": 328, "total_steps": 400, "loss": 0.0528, "lr": 9.807156969139135e-08, "epoch": 82.0, "percentage": 82.0, "elapsed_time": "0:31:00", "remaining_time": "0:06:48"} | |
| {"current_steps": 329, "total_steps": 400, "loss": 0.0748, "lr": 9.549150281252632e-08, "epoch": 82.2909090909091, "percentage": 82.25, "elapsed_time": "0:31:06", "remaining_time": "0:06:42"} | |
| {"current_steps": 330, "total_steps": 400, "loss": 0.0833, "lr": 9.294224082184044e-08, "epoch": 82.58181818181818, "percentage": 82.5, "elapsed_time": "0:31:12", "remaining_time": "0:06:37"} | |
| {"current_steps": 331, "total_steps": 400, "loss": 0.0516, "lr": 9.042397785550404e-08, "epoch": 82.87272727272727, "percentage": 82.75, "elapsed_time": "0:31:19", "remaining_time": "0:06:31"} | |
| {"current_steps": 332, "total_steps": 400, "loss": 0.0633, "lr": 8.793690568899215e-08, "epoch": 83.0, "percentage": 83.0, "elapsed_time": "0:31:22", "remaining_time": "0:06:25"} | |
| {"current_steps": 333, "total_steps": 400, "loss": 0.0618, "lr": 8.548121372247919e-08, "epoch": 83.2909090909091, "percentage": 83.25, "elapsed_time": "0:31:29", "remaining_time": "0:06:20"} | |
| {"current_steps": 334, "total_steps": 400, "loss": 0.0481, "lr": 8.305708896641594e-08, "epoch": 83.58181818181818, "percentage": 83.5, "elapsed_time": "0:31:35", "remaining_time": "0:06:14"} | |
| {"current_steps": 335, "total_steps": 400, "loss": 0.0889, "lr": 8.066471602728803e-08, "epoch": 83.87272727272727, "percentage": 83.75, "elapsed_time": "0:31:41", "remaining_time": "0:06:08"} | |
| {"current_steps": 336, "total_steps": 400, "loss": 0.0769, "lr": 7.830427709355725e-08, "epoch": 84.0, "percentage": 84.0, "elapsed_time": "0:31:44", "remaining_time": "0:06:02"} | |
| {"current_steps": 337, "total_steps": 400, "loss": 0.056, "lr": 7.597595192178702e-08, "epoch": 84.2909090909091, "percentage": 84.25, "elapsed_time": "0:31:50", "remaining_time": "0:05:57"} | |
| {"current_steps": 338, "total_steps": 400, "loss": 0.0545, "lr": 7.36799178229539e-08, "epoch": 84.58181818181818, "percentage": 84.5, "elapsed_time": "0:31:57", "remaining_time": "0:05:51"} | |
| {"current_steps": 339, "total_steps": 400, "loss": 0.0909, "lr": 7.141634964894388e-08, "epoch": 84.87272727272727, "percentage": 84.75, "elapsed_time": "0:32:03", "remaining_time": "0:05:46"} | |
| {"current_steps": 340, "total_steps": 400, "loss": 0.0483, "lr": 6.918541977923708e-08, "epoch": 85.0, "percentage": 85.0, "elapsed_time": "0:32:06", "remaining_time": "0:05:40"} | |
| {"current_steps": 341, "total_steps": 400, "loss": 0.057, "lr": 6.698729810778064e-08, "epoch": 85.2909090909091, "percentage": 85.25, "elapsed_time": "0:32:13", "remaining_time": "0:05:34"} | |
| {"current_steps": 342, "total_steps": 400, "loss": 0.0498, "lr": 6.482215203005015e-08, "epoch": 85.58181818181818, "percentage": 85.5, "elapsed_time": "0:32:19", "remaining_time": "0:05:28"} | |
| {"current_steps": 343, "total_steps": 400, "loss": 0.0791, "lr": 6.269014643030212e-08, "epoch": 85.87272727272727, "percentage": 85.75, "elapsed_time": "0:32:26", "remaining_time": "0:05:23"} | |
| {"current_steps": 344, "total_steps": 400, "loss": 0.0849, "lr": 6.059144366901736e-08, "epoch": 86.0, "percentage": 86.0, "elapsed_time": "0:32:29", "remaining_time": "0:05:17"} | |
| {"current_steps": 345, "total_steps": 400, "loss": 0.0915, "lr": 5.8526203570536504e-08, "epoch": 86.2909090909091, "percentage": 86.25, "elapsed_time": "0:32:36", "remaining_time": "0:05:11"} | |
| {"current_steps": 346, "total_steps": 400, "loss": 0.0547, "lr": 5.649458341088914e-08, "epoch": 86.58181818181818, "percentage": 86.5, "elapsed_time": "0:32:42", "remaining_time": "0:05:06"} | |
| {"current_steps": 347, "total_steps": 400, "loss": 0.0477, "lr": 5.44967379058161e-08, "epoch": 86.87272727272727, "percentage": 86.75, "elapsed_time": "0:32:48", "remaining_time": "0:05:00"} | |
| {"current_steps": 348, "total_steps": 400, "loss": 0.057, "lr": 5.25328191989875e-08, "epoch": 87.0, "percentage": 87.0, "elapsed_time": "0:32:51", "remaining_time": "0:04:54"} | |
| {"current_steps": 349, "total_steps": 400, "loss": 0.0847, "lr": 5.060297685041659e-08, "epoch": 87.2909090909091, "percentage": 87.25, "elapsed_time": "0:32:58", "remaining_time": "0:04:49"} | |
| {"current_steps": 350, "total_steps": 400, "loss": 0.0456, "lr": 4.870735782506979e-08, "epoch": 87.58181818181818, "percentage": 87.5, "elapsed_time": "0:33:04", "remaining_time": "0:04:43"} | |
| {"current_steps": 351, "total_steps": 400, "loss": 0.0553, "lr": 4.684610648167503e-08, "epoch": 87.87272727272727, "percentage": 87.75, "elapsed_time": "0:33:10", "remaining_time": "0:04:37"} | |
| {"current_steps": 352, "total_steps": 400, "loss": 0.0671, "lr": 4.5019364561728446e-08, "epoch": 88.0, "percentage": 88.0, "elapsed_time": "0:33:14", "remaining_time": "0:04:31"} | |
| {"current_steps": 353, "total_steps": 400, "loss": 0.058, "lr": 4.322727117869951e-08, "epoch": 88.2909090909091, "percentage": 88.25, "elapsed_time": "0:33:20", "remaining_time": "0:04:26"} | |
| {"current_steps": 354, "total_steps": 400, "loss": 0.0604, "lr": 4.1469962807437976e-08, "epoch": 88.58181818181818, "percentage": 88.5, "elapsed_time": "0:33:27", "remaining_time": "0:04:20"} | |
| {"current_steps": 355, "total_steps": 400, "loss": 0.0738, "lr": 3.974757327377981e-08, "epoch": 88.87272727272727, "percentage": 88.75, "elapsed_time": "0:33:33", "remaining_time": "0:04:15"} | |
| {"current_steps": 356, "total_steps": 400, "loss": 0.0568, "lr": 3.806023374435663e-08, "epoch": 89.0, "percentage": 89.0, "elapsed_time": "0:33:36", "remaining_time": "0:04:09"} | |
| {"current_steps": 357, "total_steps": 400, "loss": 0.0559, "lr": 3.6408072716606345e-08, "epoch": 89.2909090909091, "percentage": 89.25, "elapsed_time": "0:33:42", "remaining_time": "0:04:03"} | |
| {"current_steps": 358, "total_steps": 400, "loss": 0.0872, "lr": 3.479121600898777e-08, "epoch": 89.58181818181818, "percentage": 89.5, "elapsed_time": "0:33:49", "remaining_time": "0:03:58"} | |
| {"current_steps": 359, "total_steps": 400, "loss": 0.0429, "lr": 3.3209786751399184e-08, "epoch": 89.87272727272727, "percentage": 89.75, "elapsed_time": "0:33:55", "remaining_time": "0:03:52"} | |
| {"current_steps": 360, "total_steps": 400, "loss": 0.0594, "lr": 3.166390537580121e-08, "epoch": 90.0, "percentage": 90.0, "elapsed_time": "0:33:58", "remaining_time": "0:03:46"} | |
| {"current_steps": 361, "total_steps": 400, "loss": 0.0777, "lr": 3.015368960704584e-08, "epoch": 90.2909090909091, "percentage": 90.25, "elapsed_time": "0:34:04", "remaining_time": "0:03:40"} | |
| {"current_steps": 362, "total_steps": 400, "loss": 0.0591, "lr": 2.8679254453910785e-08, "epoch": 90.58181818181818, "percentage": 90.5, "elapsed_time": "0:34:11", "remaining_time": "0:03:35"} | |
| {"current_steps": 1, "total_steps": 32, "loss": 0.7859, "lr": 0.0, "epoch": 0.2909090909090909, "percentage": 3.12, "elapsed_time": "0:00:09", "remaining_time": "0:04:53"} | |
| {"current_steps": 2, "total_steps": 32, "loss": 0.7965, "lr": 2.5e-08, "epoch": 0.5818181818181818, "percentage": 6.25, "elapsed_time": "0:00:16", "remaining_time": "0:04:03"} | |
| {"current_steps": 3, "total_steps": 32, "loss": 0.7893, "lr": 5e-08, "epoch": 0.8727272727272727, "percentage": 9.38, "elapsed_time": "0:00:23", "remaining_time": "0:03:47"} | |
| {"current_steps": 4, "total_steps": 32, "loss": 0.8701, "lr": 7.5e-08, "epoch": 1.0, "percentage": 12.5, "elapsed_time": "0:00:26", "remaining_time": "0:03:06"} | |
| {"current_steps": 5, "total_steps": 32, "loss": 0.7784, "lr": 1e-07, "epoch": 1.290909090909091, "percentage": 15.62, "elapsed_time": "0:00:34", "remaining_time": "0:03:03"} | |
| {"current_steps": 6, "total_steps": 32, "loss": 0.7589, "lr": 9.971704944519592e-08, "epoch": 1.5818181818181818, "percentage": 18.75, "elapsed_time": "0:00:40", "remaining_time": "0:02:57"} | |
| {"current_steps": 7, "total_steps": 32, "loss": 0.8307, "lr": 9.887175604818205e-08, "epoch": 1.8727272727272726, "percentage": 21.88, "elapsed_time": "0:00:47", "remaining_time": "0:02:50"} | |
| {"current_steps": 8, "total_steps": 32, "loss": 0.8821, "lr": 9.747474986387654e-08, "epoch": 2.0, "percentage": 25.0, "elapsed_time": "0:00:50", "remaining_time": "0:02:32"} | |
| {"current_steps": 9, "total_steps": 32, "loss": 0.7998, "lr": 9.554359905560885e-08, "epoch": 2.290909090909091, "percentage": 28.12, "elapsed_time": "0:00:58", "remaining_time": "0:02:28"} | |
| {"current_steps": 10, "total_steps": 32, "loss": 0.8196, "lr": 9.310258896527278e-08, "epoch": 2.581818181818182, "percentage": 31.25, "elapsed_time": "0:01:04", "remaining_time": "0:02:22"} | |
| {"current_steps": 11, "total_steps": 32, "loss": 0.7766, "lr": 9.018241671106134e-08, "epoch": 2.8727272727272726, "percentage": 34.38, "elapsed_time": "0:01:12", "remaining_time": "0:02:17"} | |
| {"current_steps": 12, "total_steps": 32, "loss": 0.8289, "lr": 8.681980515339464e-08, "epoch": 3.0, "percentage": 37.5, "elapsed_time": "0:01:15", "remaining_time": "0:02:05"} | |
| {"current_steps": 13, "total_steps": 32, "loss": 0.8375, "lr": 8.305704108364301e-08, "epoch": 3.290909090909091, "percentage": 40.62, "elapsed_time": "0:01:22", "remaining_time": "0:02:00"} | |
| {"current_steps": 14, "total_steps": 32, "loss": 0.8383, "lr": 7.894144344319013e-08, "epoch": 3.581818181818182, "percentage": 43.75, "elapsed_time": "0:01:29", "remaining_time": "0:01:54"} | |
| {"current_steps": 15, "total_steps": 32, "loss": 0.772, "lr": 7.452476826029011e-08, "epoch": 3.8727272727272726, "percentage": 46.88, "elapsed_time": "0:01:36", "remaining_time": "0:01:49"} | |
| {"current_steps": 16, "total_steps": 32, "loss": 0.7012, "lr": 6.986255778798252e-08, "epoch": 4.0, "percentage": 50.0, "elapsed_time": "0:01:39", "remaining_time": "0:01:39"} | |
| {"current_steps": 17, "total_steps": 32, "loss": 0.777, "lr": 6.501344202803413e-08, "epoch": 4.290909090909091, "percentage": 53.12, "elapsed_time": "0:02:14", "remaining_time": "0:01:58"} | |
| {"current_steps": 18, "total_steps": 32, "loss": 0.8631, "lr": 6.003840142464886e-08, "epoch": 4.581818181818182, "percentage": 56.25, "elapsed_time": "0:02:21", "remaining_time": "0:01:49"} | |
| {"current_steps": 19, "total_steps": 32, "loss": 0.7819, "lr": 5.5e-08, "epoch": 4.872727272727273, "percentage": 59.38, "elapsed_time": "0:02:28", "remaining_time": "0:01:41"} | |
| {"current_steps": 20, "total_steps": 32, "loss": 0.7722, "lr": 4.996159857535115e-08, "epoch": 5.0, "percentage": 62.5, "elapsed_time": "0:02:31", "remaining_time": "0:01:31"} | |
| {"current_steps": 21, "total_steps": 32, "loss": 0.7416, "lr": 4.498655797196585e-08, "epoch": 5.290909090909091, "percentage": 65.62, "elapsed_time": "0:02:39", "remaining_time": "0:01:23"} | |
| {"current_steps": 22, "total_steps": 32, "loss": 0.8161, "lr": 4.0137442212017494e-08, "epoch": 5.581818181818182, "percentage": 68.75, "elapsed_time": "0:02:46", "remaining_time": "0:01:15"} | |
| {"current_steps": 23, "total_steps": 32, "loss": 0.823, "lr": 3.5475231739709885e-08, "epoch": 5.872727272727273, "percentage": 71.88, "elapsed_time": "0:02:53", "remaining_time": "0:01:08"} | |
| {"current_steps": 24, "total_steps": 32, "loss": 0.8315, "lr": 3.105855655680986e-08, "epoch": 6.0, "percentage": 75.0, "elapsed_time": "0:02:56", "remaining_time": "0:00:58"} | |
| {"current_steps": 25, "total_steps": 32, "loss": 0.8316, "lr": 2.6942958916356994e-08, "epoch": 6.290909090909091, "percentage": 78.12, "elapsed_time": "0:03:04", "remaining_time": "0:00:51"} | |
| {"current_steps": 26, "total_steps": 32, "loss": 0.7542, "lr": 2.3180194846605363e-08, "epoch": 6.581818181818182, "percentage": 81.25, "elapsed_time": "0:03:11", "remaining_time": "0:00:44"} | |
| {"current_steps": 27, "total_steps": 32, "loss": 0.8357, "lr": 1.981758328893866e-08, "epoch": 6.872727272727273, "percentage": 84.38, "elapsed_time": "0:03:18", "remaining_time": "0:00:36"} | |
| {"current_steps": 28, "total_steps": 32, "loss": 0.7426, "lr": 1.6897411034727217e-08, "epoch": 7.0, "percentage": 87.5, "elapsed_time": "0:03:21", "remaining_time": "0:00:28"} | |
| {"current_steps": 29, "total_steps": 32, "loss": 0.7832, "lr": 1.4456400944391145e-08, "epoch": 7.290909090909091, "percentage": 90.62, "elapsed_time": "0:03:28", "remaining_time": "0:00:21"} | |
| {"current_steps": 30, "total_steps": 32, "loss": 0.7954, "lr": 1.2525250136123459e-08, "epoch": 7.581818181818182, "percentage": 93.75, "elapsed_time": "0:03:35", "remaining_time": "0:00:14"} | |
| {"current_steps": 31, "total_steps": 32, "loss": 0.7893, "lr": 1.1128243951817936e-08, "epoch": 7.872727272727273, "percentage": 96.88, "elapsed_time": "0:03:43", "remaining_time": "0:00:07"} | |
| {"current_steps": 32, "total_steps": 32, "loss": 0.9104, "lr": 1.0282950554804083e-08, "epoch": 8.0, "percentage": 100.0, "elapsed_time": "0:03:46", "remaining_time": "0:00:00"} | |
| {"current_steps": 32, "total_steps": 32, "epoch": 8.0, "percentage": 100.0, "elapsed_time": "0:04:11", "remaining_time": "0:00:00"} | |
| {"current_steps": 1, "total_steps": 400, "loss": 0.7859, "lr": 0.0, "epoch": 0.2909090909090909, "percentage": 0.25, "elapsed_time": "0:00:07", "remaining_time": "0:50:47"} | |
| {"current_steps": 2, "total_steps": 400, "loss": 0.7965, "lr": 2.5e-09, "epoch": 0.5818181818181818, "percentage": 0.5, "elapsed_time": "0:00:14", "remaining_time": "0:46:43"} | |
| {"current_steps": 3, "total_steps": 400, "loss": 0.7893, "lr": 5e-09, "epoch": 0.8727272727272727, "percentage": 0.75, "elapsed_time": "0:00:21", "remaining_time": "0:46:51"} | |
| {"current_steps": 4, "total_steps": 400, "loss": 0.8702, "lr": 7.5e-09, "epoch": 1.0, "percentage": 1.0, "elapsed_time": "0:00:24", "remaining_time": "0:39:53"} | |
| {"current_steps": 5, "total_steps": 400, "loss": 0.7785, "lr": 1e-08, "epoch": 1.290909090909091, "percentage": 1.25, "elapsed_time": "0:00:31", "remaining_time": "0:41:18"} | |
| {"current_steps": 6, "total_steps": 400, "loss": 0.759, "lr": 1.25e-08, "epoch": 1.5818181818181818, "percentage": 1.5, "elapsed_time": "0:00:37", "remaining_time": "0:41:30"} | |
| {"current_steps": 7, "total_steps": 400, "loss": 0.8308, "lr": 1.5e-08, "epoch": 1.8727272727272726, "percentage": 1.75, "elapsed_time": "0:00:44", "remaining_time": "0:41:43"} | |
| {"current_steps": 8, "total_steps": 400, "loss": 0.8828, "lr": 1.7499999999999998e-08, "epoch": 2.0, "percentage": 2.0, "elapsed_time": "0:00:47", "remaining_time": "0:38:57"} | |
| {"current_steps": 9, "total_steps": 400, "loss": 0.8004, "lr": 2e-08, "epoch": 2.290909090909091, "percentage": 2.25, "elapsed_time": "0:00:54", "remaining_time": "0:39:39"} | |
| {"current_steps": 10, "total_steps": 400, "loss": 0.8204, "lr": 2.25e-08, "epoch": 2.581818181818182, "percentage": 2.5, "elapsed_time": "0:01:01", "remaining_time": "0:39:46"} | |
| {"current_steps": 11, "total_steps": 400, "loss": 0.7771, "lr": 2.5e-08, "epoch": 2.8727272727272726, "percentage": 2.75, "elapsed_time": "0:01:08", "remaining_time": "0:40:12"} | |
| {"current_steps": 12, "total_steps": 400, "loss": 0.8295, "lr": 2.75e-08, "epoch": 3.0, "percentage": 3.0, "elapsed_time": "0:01:11", "remaining_time": "0:38:28"} | |
| {"current_steps": 13, "total_steps": 400, "loss": 0.8378, "lr": 3e-08, "epoch": 3.290909090909091, "percentage": 3.25, "elapsed_time": "0:01:18", "remaining_time": "0:38:52"} | |
| {"current_steps": 14, "total_steps": 400, "loss": 0.8398, "lr": 3.25e-08, "epoch": 3.581818181818182, "percentage": 3.5, "elapsed_time": "0:01:24", "remaining_time": "0:38:57"} | |
| {"current_steps": 15, "total_steps": 400, "loss": 0.773, "lr": 3.4999999999999996e-08, "epoch": 3.8727272727272726, "percentage": 3.75, "elapsed_time": "0:01:31", "remaining_time": "0:39:21"} | |
| {"current_steps": 16, "total_steps": 400, "loss": 0.7025, "lr": 3.75e-08, "epoch": 4.0, "percentage": 4.0, "elapsed_time": "0:01:34", "remaining_time": "0:37:56"} | |
| {"current_steps": 16, "total_steps": 400, "eval_loss": 0.760595977306366, "epoch": 4.0, "percentage": 4.0, "elapsed_time": "0:01:35", "remaining_time": "0:38:14"} | |
| {"current_steps": 17, "total_steps": 400, "loss": 0.7785, "lr": 4e-08, "epoch": 4.290909090909091, "percentage": 4.25, "elapsed_time": "0:02:05", "remaining_time": "0:47:18"} | |
| {"current_steps": 18, "total_steps": 400, "loss": 0.8645, "lr": 4.25e-08, "epoch": 4.581818181818182, "percentage": 4.5, "elapsed_time": "0:02:12", "remaining_time": "0:46:59"} | |
| {"current_steps": 19, "total_steps": 400, "loss": 0.7834, "lr": 4.5e-08, "epoch": 4.872727272727273, "percentage": 4.75, "elapsed_time": "0:02:20", "remaining_time": "0:46:50"} | |
| {"current_steps": 20, "total_steps": 400, "loss": 0.7744, "lr": 4.7499999999999995e-08, "epoch": 5.0, "percentage": 5.0, "elapsed_time": "0:02:23", "remaining_time": "0:45:19"} | |
| {"current_steps": 21, "total_steps": 400, "loss": 0.7433, "lr": 5e-08, "epoch": 5.290909090909091, "percentage": 5.25, "elapsed_time": "0:02:30", "remaining_time": "0:45:07"} | |
| {"current_steps": 22, "total_steps": 400, "loss": 0.818, "lr": 5.25e-08, "epoch": 5.581818181818182, "percentage": 5.5, "elapsed_time": "0:02:37", "remaining_time": "0:45:03"} | |
| {"current_steps": 23, "total_steps": 400, "loss": 0.8245, "lr": 5.5e-08, "epoch": 5.872727272727273, "percentage": 5.75, "elapsed_time": "0:02:44", "remaining_time": "0:44:56"} | |
| {"current_steps": 24, "total_steps": 400, "loss": 0.8331, "lr": 5.749999999999999e-08, "epoch": 6.0, "percentage": 6.0, "elapsed_time": "0:02:47", "remaining_time": "0:43:40"} | |
| {"current_steps": 25, "total_steps": 400, "loss": 0.8331, "lr": 6e-08, "epoch": 6.290909090909091, "percentage": 6.25, "elapsed_time": "0:02:54", "remaining_time": "0:43:33"} | |
| {"current_steps": 26, "total_steps": 400, "loss": 0.755, "lr": 6.25e-08, "epoch": 6.581818181818182, "percentage": 6.5, "elapsed_time": "0:03:01", "remaining_time": "0:43:29"} | |
| {"current_steps": 27, "total_steps": 400, "loss": 0.8372, "lr": 6.5e-08, "epoch": 6.872727272727273, "percentage": 6.75, "elapsed_time": "0:03:08", "remaining_time": "0:43:20"} | |
| {"current_steps": 28, "total_steps": 400, "loss": 0.7442, "lr": 6.75e-08, "epoch": 7.0, "percentage": 7.0, "elapsed_time": "0:03:11", "remaining_time": "0:42:18"} | |
| {"current_steps": 29, "total_steps": 400, "loss": 0.7851, "lr": 6.999999999999999e-08, "epoch": 7.290909090909091, "percentage": 7.25, "elapsed_time": "0:03:17", "remaining_time": "0:42:11"} | |
| {"current_steps": 30, "total_steps": 400, "loss": 0.7962, "lr": 7.25e-08, "epoch": 7.581818181818182, "percentage": 7.5, "elapsed_time": "0:03:24", "remaining_time": "0:42:06"} | |
| {"current_steps": 31, "total_steps": 400, "loss": 0.79, "lr": 7.5e-08, "epoch": 7.872727272727273, "percentage": 7.75, "elapsed_time": "0:03:32", "remaining_time": "0:42:06"} | |
| {"current_steps": 32, "total_steps": 400, "loss": 0.9105, "lr": 7.75e-08, "epoch": 8.0, "percentage": 8.0, "elapsed_time": "0:03:35", "remaining_time": "0:41:12"} | |
| {"current_steps": 32, "total_steps": 400, "eval_loss": 0.7589532136917114, "epoch": 8.0, "percentage": 8.0, "elapsed_time": "0:03:35", "remaining_time": "0:41:21"} | |
| {"current_steps": 33, "total_steps": 400, "loss": 0.7914, "lr": 8e-08, "epoch": 8.290909090909091, "percentage": 8.25, "elapsed_time": "0:04:00", "remaining_time": "0:44:35"} | |
| {"current_steps": 34, "total_steps": 400, "loss": 0.8344, "lr": 8.249999999999999e-08, "epoch": 8.581818181818182, "percentage": 8.5, "elapsed_time": "0:04:07", "remaining_time": "0:44:24"} | |
| {"current_steps": 35, "total_steps": 400, "loss": 0.7419, "lr": 8.5e-08, "epoch": 8.872727272727273, "percentage": 8.75, "elapsed_time": "0:04:13", "remaining_time": "0:44:07"} | |
| {"current_steps": 36, "total_steps": 400, "loss": 0.8597, "lr": 8.75e-08, "epoch": 9.0, "percentage": 9.0, "elapsed_time": "0:04:16", "remaining_time": "0:43:17"} | |
| {"current_steps": 37, "total_steps": 400, "loss": 0.7911, "lr": 9e-08, "epoch": 9.290909090909091, "percentage": 9.25, "elapsed_time": "0:04:23", "remaining_time": "0:43:05"} | |
| {"current_steps": 38, "total_steps": 400, "loss": 0.852, "lr": 9.25e-08, "epoch": 9.581818181818182, "percentage": 9.5, "elapsed_time": "0:04:30", "remaining_time": "0:42:59"} | |
| {"current_steps": 39, "total_steps": 400, "loss": 0.7942, "lr": 9.499999999999999e-08, "epoch": 9.872727272727273, "percentage": 9.75, "elapsed_time": "0:04:37", "remaining_time": "0:42:48"} | |
| {"current_steps": 40, "total_steps": 400, "loss": 0.7006, "lr": 9.749999999999999e-08, "epoch": 10.0, "percentage": 10.0, "elapsed_time": "0:04:40", "remaining_time": "0:42:03"} | |
| {"current_steps": 41, "total_steps": 400, "loss": 0.7496, "lr": 1e-07, "epoch": 10.290909090909091, "percentage": 10.25, "elapsed_time": "0:04:47", "remaining_time": "0:41:54"} | |
| {"current_steps": 42, "total_steps": 400, "loss": 0.7978, "lr": 9.99982865378877e-08, "epoch": 10.581818181818182, "percentage": 10.5, "elapsed_time": "0:04:54", "remaining_time": "0:41:47"} | |
| {"current_steps": 43, "total_steps": 400, "loss": 0.8437, "lr": 9.99931462820376e-08, "epoch": 10.872727272727273, "percentage": 10.75, "elapsed_time": "0:05:01", "remaining_time": "0:41:39"} | |
| {"current_steps": 44, "total_steps": 400, "loss": 0.7926, "lr": 9.998457962390006e-08, "epoch": 11.0, "percentage": 11.0, "elapsed_time": "0:05:03", "remaining_time": "0:40:58"} | |
| {"current_steps": 45, "total_steps": 400, "loss": 0.7521, "lr": 9.997258721585931e-08, "epoch": 11.290909090909091, "percentage": 11.25, "elapsed_time": "0:05:10", "remaining_time": "0:40:49"} | |
| {"current_steps": 46, "total_steps": 400, "loss": 0.7497, "lr": 9.99571699711836e-08, "epoch": 11.581818181818182, "percentage": 11.5, "elapsed_time": "0:05:17", "remaining_time": "0:40:42"} | |
| {"current_steps": 47, "total_steps": 400, "loss": 0.8709, "lr": 9.993832906395581e-08, "epoch": 11.872727272727273, "percentage": 11.75, "elapsed_time": "0:05:24", "remaining_time": "0:40:38"} | |
| {"current_steps": 48, "total_steps": 400, "loss": 0.8193, "lr": 9.991606592898401e-08, "epoch": 12.0, "percentage": 12.0, "elapsed_time": "0:05:27", "remaining_time": "0:40:00"} | |
| {"current_steps": 48, "total_steps": 400, "eval_loss": 0.7549822926521301, "epoch": 12.0, "percentage": 12.0, "elapsed_time": "0:05:28", "remaining_time": "0:40:06"} | |
| {"current_steps": 49, "total_steps": 400, "loss": 0.8488, "lr": 9.989038226169209e-08, "epoch": 12.290909090909091, "percentage": 12.25, "elapsed_time": "0:05:57", "remaining_time": "0:42:40"} | |
| {"current_steps": 50, "total_steps": 400, "loss": 0.7697, "lr": 9.986128001799076e-08, "epoch": 12.581818181818182, "percentage": 12.5, "elapsed_time": "0:06:04", "remaining_time": "0:42:33"} | |
| {"current_steps": 51, "total_steps": 400, "loss": 0.769, "lr": 9.982876141412855e-08, "epoch": 12.872727272727273, "percentage": 12.75, "elapsed_time": "0:06:11", "remaining_time": "0:42:22"} | |
| {"current_steps": 52, "total_steps": 400, "loss": 0.8111, "lr": 9.979282892652304e-08, "epoch": 13.0, "percentage": 13.0, "elapsed_time": "0:06:14", "remaining_time": "0:41:48"} | |
| {"current_steps": 53, "total_steps": 400, "loss": 0.798, "lr": 9.975348529157229e-08, "epoch": 13.290909090909091, "percentage": 13.25, "elapsed_time": "0:06:21", "remaining_time": "0:41:39"} | |
| {"current_steps": 54, "total_steps": 400, "loss": 0.8011, "lr": 9.971073350544643e-08, "epoch": 13.581818181818182, "percentage": 13.5, "elapsed_time": "0:06:28", "remaining_time": "0:41:30"} | |
| {"current_steps": 55, "total_steps": 400, "loss": 0.7109, "lr": 9.966457682385949e-08, "epoch": 13.872727272727273, "percentage": 13.75, "elapsed_time": "0:06:35", "remaining_time": "0:41:23"} | |
| {"current_steps": 56, "total_steps": 400, "loss": 0.969, "lr": 9.961501876182147e-08, "epoch": 14.0, "percentage": 14.0, "elapsed_time": "0:06:38", "remaining_time": "0:40:50"} | |
| {"current_steps": 57, "total_steps": 400, "loss": 0.7757, "lr": 9.956206309337066e-08, "epoch": 14.290909090909091, "percentage": 14.25, "elapsed_time": "0:06:46", "remaining_time": "0:40:44"} | |
| {"current_steps": 58, "total_steps": 400, "loss": 0.7974, "lr": 9.950571385128625e-08, "epoch": 14.581818181818182, "percentage": 14.5, "elapsed_time": "0:06:53", "remaining_time": "0:40:35"} | |
| {"current_steps": 59, "total_steps": 400, "loss": 0.842, "lr": 9.94459753267812e-08, "epoch": 14.872727272727273, "percentage": 14.75, "elapsed_time": "0:06:59", "remaining_time": "0:40:26"} | |
| {"current_steps": 60, "total_steps": 400, "loss": 0.7127, "lr": 9.938285206917541e-08, "epoch": 15.0, "percentage": 15.0, "elapsed_time": "0:07:02", "remaining_time": "0:39:55"} | |
| {"current_steps": 61, "total_steps": 400, "loss": 0.7662, "lr": 9.931634888554937e-08, "epoch": 15.290909090909091, "percentage": 15.25, "elapsed_time": "0:07:10", "remaining_time": "0:39:51"} | |
| {"current_steps": 62, "total_steps": 400, "loss": 0.7652, "lr": 9.924647084037797e-08, "epoch": 15.581818181818182, "percentage": 15.5, "elapsed_time": "0:07:16", "remaining_time": "0:39:40"} | |
| {"current_steps": 63, "total_steps": 400, "loss": 0.854, "lr": 9.917322325514488e-08, "epoch": 15.872727272727273, "percentage": 15.75, "elapsed_time": "0:07:23", "remaining_time": "0:39:33"} | |
| {"current_steps": 64, "total_steps": 400, "loss": 0.6939, "lr": 9.909661170793732e-08, "epoch": 16.0, "percentage": 16.0, "elapsed_time": "0:07:26", "remaining_time": "0:39:04"} | |
| {"current_steps": 64, "total_steps": 400, "eval_loss": 0.7460314631462097, "epoch": 16.0, "percentage": 16.0, "elapsed_time": "0:07:27", "remaining_time": "0:39:08"} | |
| {"current_steps": 65, "total_steps": 400, "loss": 0.7894, "lr": 9.901664203302125e-08, "epoch": 16.29090909090909, "percentage": 16.25, "elapsed_time": "0:07:53", "remaining_time": "0:40:40"} | |
| {"current_steps": 66, "total_steps": 400, "loss": 0.7476, "lr": 9.8933320320397e-08, "epoch": 16.581818181818182, "percentage": 16.5, "elapsed_time": "0:07:59", "remaining_time": "0:40:28"} | |
| {"current_steps": 67, "total_steps": 400, "loss": 0.8294, "lr": 9.884665291533559e-08, "epoch": 16.87272727272727, "percentage": 16.75, "elapsed_time": "0:08:06", "remaining_time": "0:40:20"} | |
| {"current_steps": 68, "total_steps": 400, "loss": 0.741, "lr": 9.875664641789545e-08, "epoch": 17.0, "percentage": 17.0, "elapsed_time": "0:08:09", "remaining_time": "0:39:51"} | |
| {"current_steps": 69, "total_steps": 400, "loss": 0.7999, "lr": 9.866330768241983e-08, "epoch": 17.29090909090909, "percentage": 17.25, "elapsed_time": "0:08:16", "remaining_time": "0:39:42"} | |
| {"current_steps": 70, "total_steps": 400, "loss": 0.8324, "lr": 9.856664381701484e-08, "epoch": 17.581818181818182, "percentage": 17.5, "elapsed_time": "0:08:23", "remaining_time": "0:39:32"} | |
| {"current_steps": 71, "total_steps": 400, "loss": 0.7308, "lr": 9.846666218300807e-08, "epoch": 17.87272727272727, "percentage": 17.75, "elapsed_time": "0:08:29", "remaining_time": "0:39:22"} | |
| {"current_steps": 72, "total_steps": 400, "loss": 0.7691, "lr": 9.836337039438803e-08, "epoch": 18.0, "percentage": 18.0, "elapsed_time": "0:08:33", "remaining_time": "0:38:58"} | |
| {"current_steps": 73, "total_steps": 400, "loss": 0.7804, "lr": 9.825677631722435e-08, "epoch": 18.29090909090909, "percentage": 18.25, "elapsed_time": "0:08:39", "remaining_time": "0:38:49"} | |
| {"current_steps": 74, "total_steps": 400, "loss": 0.808, "lr": 9.814688806906868e-08, "epoch": 18.581818181818182, "percentage": 18.5, "elapsed_time": "0:08:46", "remaining_time": "0:38:40"} | |
| {"current_steps": 75, "total_steps": 400, "loss": 0.7593, "lr": 9.80337140183366e-08, "epoch": 18.87272727272727, "percentage": 18.75, "elapsed_time": "0:08:53", "remaining_time": "0:38:32"} | |
| {"current_steps": 76, "total_steps": 400, "loss": 0.795, "lr": 9.791726278367021e-08, "epoch": 19.0, "percentage": 19.0, "elapsed_time": "0:08:56", "remaining_time": "0:38:07"} | |
| {"current_steps": 77, "total_steps": 400, "loss": 0.8303, "lr": 9.779754323328191e-08, "epoch": 19.29090909090909, "percentage": 19.25, "elapsed_time": "0:09:03", "remaining_time": "0:37:58"} | |
| {"current_steps": 78, "total_steps": 400, "loss": 0.7404, "lr": 9.767456448427896e-08, "epoch": 19.581818181818182, "percentage": 19.5, "elapsed_time": "0:09:09", "remaining_time": "0:37:50"} | |
| {"current_steps": 79, "total_steps": 400, "loss": 0.8152, "lr": 9.754833590196926e-08, "epoch": 19.87272727272727, "percentage": 19.75, "elapsed_time": "0:09:16", "remaining_time": "0:37:43"} | |
| {"current_steps": 80, "total_steps": 400, "loss": 0.6623, "lr": 9.741886709914803e-08, "epoch": 20.0, "percentage": 20.0, "elapsed_time": "0:09:20", "remaining_time": "0:37:20"} | |
| {"current_steps": 80, "total_steps": 400, "eval_loss": 0.7418057918548584, "epoch": 20.0, "percentage": 20.0, "elapsed_time": "0:09:20", "remaining_time": "0:37:23"} | |
| {"current_steps": 81, "total_steps": 400, "loss": 0.726, "lr": 9.728616793536587e-08, "epoch": 20.29090909090909, "percentage": 20.25, "elapsed_time": "0:09:49", "remaining_time": "0:38:43"} | |
| {"current_steps": 82, "total_steps": 400, "loss": 0.7908, "lr": 9.715024851617789e-08, "epoch": 20.581818181818182, "percentage": 20.5, "elapsed_time": "0:09:56", "remaining_time": "0:38:34"} | |
| {"current_steps": 83, "total_steps": 400, "loss": 0.8219, "lr": 9.701111919237408e-08, "epoch": 20.87272727272727, "percentage": 20.75, "elapsed_time": "0:10:03", "remaining_time": "0:38:24"} | |
| {"current_steps": 84, "total_steps": 400, "loss": 0.7955, "lr": 9.68687905591911e-08, "epoch": 21.0, "percentage": 21.0, "elapsed_time": "0:10:06", "remaining_time": "0:38:03"} | |
| {"current_steps": 85, "total_steps": 400, "loss": 0.8459, "lr": 9.672327345550542e-08, "epoch": 21.29090909090909, "percentage": 21.25, "elapsed_time": "0:10:14", "remaining_time": "0:37:57"} | |
| {"current_steps": 86, "total_steps": 400, "loss": 0.7952, "lr": 9.65745789630079e-08, "epoch": 21.581818181818182, "percentage": 21.5, "elapsed_time": "0:10:21", "remaining_time": "0:37:47"} | |
| {"current_steps": 87, "total_steps": 400, "loss": 0.6928, "lr": 9.642271840535982e-08, "epoch": 21.87272727272727, "percentage": 21.75, "elapsed_time": "0:10:28", "remaining_time": "0:37:40"} | |
| {"current_steps": 88, "total_steps": 400, "loss": 0.7813, "lr": 9.626770334733058e-08, "epoch": 22.0, "percentage": 22.0, "elapsed_time": "0:10:31", "remaining_time": "0:37:17"} | |
| {"current_steps": 89, "total_steps": 400, "loss": 0.783, "lr": 9.610954559391703e-08, "epoch": 22.29090909090909, "percentage": 22.25, "elapsed_time": "0:10:37", "remaining_time": "0:37:08"} | |
| {"current_steps": 90, "total_steps": 400, "loss": 0.7859, "lr": 9.594825718944444e-08, "epoch": 22.581818181818182, "percentage": 22.5, "elapsed_time": "0:10:44", "remaining_time": "0:36:58"} | |
| {"current_steps": 91, "total_steps": 400, "loss": 0.7784, "lr": 9.578385041664925e-08, "epoch": 22.87272727272727, "percentage": 22.75, "elapsed_time": "0:10:51", "remaining_time": "0:36:51"} | |
| {"current_steps": 92, "total_steps": 400, "loss": 0.7613, "lr": 9.561633779574373e-08, "epoch": 23.0, "percentage": 23.0, "elapsed_time": "0:10:54", "remaining_time": "0:36:31"} | |
| {"current_steps": 93, "total_steps": 400, "loss": 0.7708, "lr": 9.544573208346251e-08, "epoch": 23.29090909090909, "percentage": 23.25, "elapsed_time": "0:11:01", "remaining_time": "0:36:24"} | |
| {"current_steps": 94, "total_steps": 400, "loss": 0.7975, "lr": 9.527204627209113e-08, "epoch": 23.581818181818182, "percentage": 23.5, "elapsed_time": "0:11:08", "remaining_time": "0:36:15"} | |
| {"current_steps": 95, "total_steps": 400, "loss": 0.7533, "lr": 9.509529358847655e-08, "epoch": 23.87272727272727, "percentage": 23.75, "elapsed_time": "0:11:15", "remaining_time": "0:36:07"} | |
| {"current_steps": 96, "total_steps": 400, "loss": 0.8112, "lr": 9.491548749301997e-08, "epoch": 24.0, "percentage": 24.0, "elapsed_time": "0:11:18", "remaining_time": "0:35:48"} | |
| {"current_steps": 96, "total_steps": 400, "eval_loss": 0.7388671040534973, "epoch": 24.0, "percentage": 24.0, "elapsed_time": "0:11:19", "remaining_time": "0:35:50"} | |
| {"current_steps": 97, "total_steps": 400, "loss": 0.779, "lr": 9.473264167865172e-08, "epoch": 24.29090909090909, "percentage": 24.25, "elapsed_time": "0:11:44", "remaining_time": "0:36:41"} | |
| {"current_steps": 98, "total_steps": 400, "loss": 0.7427, "lr": 9.454677006978843e-08, "epoch": 24.581818181818182, "percentage": 24.5, "elapsed_time": "0:11:51", "remaining_time": "0:36:32"} | |
| {"current_steps": 99, "total_steps": 400, "loss": 0.7749, "lr": 9.435788682127281e-08, "epoch": 24.87272727272727, "percentage": 24.75, "elapsed_time": "0:11:58", "remaining_time": "0:36:24"} | |
| {"current_steps": 100, "total_steps": 400, "loss": 0.8413, "lr": 9.416600631729548e-08, "epoch": 25.0, "percentage": 25.0, "elapsed_time": "0:12:01", "remaining_time": "0:36:03"} | |
| {"current_steps": 101, "total_steps": 400, "loss": 0.7987, "lr": 9.397114317029974e-08, "epoch": 25.29090909090909, "percentage": 25.25, "elapsed_time": "0:12:08", "remaining_time": "0:35:56"} | |
| {"current_steps": 102, "total_steps": 400, "loss": 0.7579, "lr": 9.377331221986867e-08, "epoch": 25.581818181818182, "percentage": 25.5, "elapsed_time": "0:12:14", "remaining_time": "0:35:47"} | |
| {"current_steps": 103, "total_steps": 400, "loss": 0.7138, "lr": 9.357252853159505e-08, "epoch": 25.87272727272727, "percentage": 25.75, "elapsed_time": "0:12:21", "remaining_time": "0:35:38"} | |
| {"current_steps": 104, "total_steps": 400, "loss": 0.8143, "lr": 9.336880739593415e-08, "epoch": 26.0, "percentage": 26.0, "elapsed_time": "0:12:24", "remaining_time": "0:35:20"} | |
| {"current_steps": 105, "total_steps": 400, "loss": 0.7595, "lr": 9.316216432703917e-08, "epoch": 26.29090909090909, "percentage": 26.25, "elapsed_time": "0:12:31", "remaining_time": "0:35:12"} | |
| {"current_steps": 106, "total_steps": 400, "loss": 0.6892, "lr": 9.295261506157986e-08, "epoch": 26.581818181818182, "percentage": 26.5, "elapsed_time": "0:12:38", "remaining_time": "0:35:03"} | |
| {"current_steps": 107, "total_steps": 400, "loss": 0.7828, "lr": 9.274017555754408e-08, "epoch": 26.87272727272727, "percentage": 26.75, "elapsed_time": "0:12:44", "remaining_time": "0:34:54"} | |
| {"current_steps": 108, "total_steps": 400, "loss": 0.8267, "lr": 9.252486199302256e-08, "epoch": 27.0, "percentage": 27.0, "elapsed_time": "0:12:48", "remaining_time": "0:34:37"} | |
| {"current_steps": 109, "total_steps": 400, "loss": 0.7837, "lr": 9.230669076497686e-08, "epoch": 27.29090909090909, "percentage": 27.25, "elapsed_time": "0:12:55", "remaining_time": "0:34:29"} | |
| {"current_steps": 110, "total_steps": 400, "loss": 0.7629, "lr": 9.20856784879907e-08, "epoch": 27.581818181818182, "percentage": 27.5, "elapsed_time": "0:13:01", "remaining_time": "0:34:20"} | |
| {"current_steps": 111, "total_steps": 400, "loss": 0.732, "lr": 9.186184199300463e-08, "epoch": 27.87272727272727, "percentage": 27.75, "elapsed_time": "0:13:09", "remaining_time": "0:34:14"} | |
| {"current_steps": 112, "total_steps": 400, "loss": 0.708, "lr": 9.163519832603437e-08, "epoch": 28.0, "percentage": 28.0, "elapsed_time": "0:13:11", "remaining_time": "0:33:56"} | |
| {"current_steps": 112, "total_steps": 400, "eval_loss": 0.7153984904289246, "epoch": 28.0, "percentage": 28.0, "elapsed_time": "0:13:12", "remaining_time": "0:33:57"} | |
| {"current_steps": 113, "total_steps": 400, "loss": 0.7923, "lr": 9.140576474687262e-08, "epoch": 28.29090909090909, "percentage": 28.25, "elapsed_time": "0:13:41", "remaining_time": "0:34:47"} | |
| {"current_steps": 114, "total_steps": 400, "loss": 0.6965, "lr": 9.117355872777476e-08, "epoch": 28.581818181818182, "percentage": 28.5, "elapsed_time": "0:13:48", "remaining_time": "0:34:39"} | |
| {"current_steps": 115, "total_steps": 400, "loss": 0.7564, "lr": 9.093859795212817e-08, "epoch": 28.87272727272727, "percentage": 28.75, "elapsed_time": "0:13:55", "remaining_time": "0:34:30"} | |
| {"current_steps": 116, "total_steps": 400, "loss": 0.7325, "lr": 9.070090031310558e-08, "epoch": 29.0, "percentage": 29.0, "elapsed_time": "0:13:58", "remaining_time": "0:34:13"} | |
| {"current_steps": 117, "total_steps": 400, "loss": 0.6957, "lr": 9.046048391230248e-08, "epoch": 29.29090909090909, "percentage": 29.25, "elapsed_time": "0:14:05", "remaining_time": "0:34:06"} | |
| {"current_steps": 118, "total_steps": 400, "loss": 0.8011, "lr": 9.021736705835861e-08, "epoch": 29.581818181818182, "percentage": 29.5, "elapsed_time": "0:14:13", "remaining_time": "0:33:59"} | |
| {"current_steps": 119, "total_steps": 400, "loss": 0.7767, "lr": 8.997156826556369e-08, "epoch": 29.87272727272727, "percentage": 29.75, "elapsed_time": "0:14:19", "remaining_time": "0:33:50"} | |
| {"current_steps": 120, "total_steps": 400, "loss": 0.6864, "lr": 8.97231062524474e-08, "epoch": 30.0, "percentage": 30.0, "elapsed_time": "0:14:23", "remaining_time": "0:33:33"} | |
| {"current_steps": 121, "total_steps": 400, "loss": 0.757, "lr": 8.9471999940354e-08, "epoch": 30.29090909090909, "percentage": 30.25, "elapsed_time": "0:14:30", "remaining_time": "0:33:26"} | |
| {"current_steps": 122, "total_steps": 400, "loss": 0.7184, "lr": 8.921826845200139e-08, "epoch": 30.581818181818182, "percentage": 30.5, "elapsed_time": "0:14:37", "remaining_time": "0:33:19"} | |
| {"current_steps": 123, "total_steps": 400, "loss": 0.8074, "lr": 8.896193111002475e-08, "epoch": 30.87272727272727, "percentage": 30.75, "elapsed_time": "0:14:44", "remaining_time": "0:33:10"} | |
| {"current_steps": 124, "total_steps": 400, "loss": 0.666, "lr": 8.87030074355051e-08, "epoch": 31.0, "percentage": 31.0, "elapsed_time": "0:14:47", "remaining_time": "0:32:54"} | |
| {"current_steps": 125, "total_steps": 400, "loss": 0.7109, "lr": 8.844151714648274e-08, "epoch": 31.29090909090909, "percentage": 31.25, "elapsed_time": "0:14:54", "remaining_time": "0:32:47"} | |
| {"current_steps": 126, "total_steps": 400, "loss": 0.7848, "lr": 8.817748015645558e-08, "epoch": 31.581818181818182, "percentage": 31.5, "elapsed_time": "0:15:00", "remaining_time": "0:32:39"} | |
| {"current_steps": 127, "total_steps": 400, "loss": 0.7756, "lr": 8.791091657286267e-08, "epoch": 31.87272727272727, "percentage": 31.75, "elapsed_time": "0:15:08", "remaining_time": "0:32:31"} | |
| {"current_steps": 128, "total_steps": 400, "loss": 0.6471, "lr": 8.764184669555293e-08, "epoch": 32.0, "percentage": 32.0, "elapsed_time": "0:15:10", "remaining_time": "0:32:15"} | |
| {"current_steps": 128, "total_steps": 400, "eval_loss": 0.7097088694572449, "epoch": 32.0, "percentage": 32.0, "elapsed_time": "0:15:11", "remaining_time": "0:32:17"} | |
| {"current_steps": 129, "total_steps": 400, "loss": 0.7418, "lr": 8.737029101523929e-08, "epoch": 32.29090909090909, "percentage": 32.25, "elapsed_time": "0:15:43", "remaining_time": "0:33:01"} | |
| {"current_steps": 130, "total_steps": 400, "loss": 0.7407, "lr": 8.709627021193817e-08, "epoch": 32.58181818181818, "percentage": 32.5, "elapsed_time": "0:15:50", "remaining_time": "0:32:53"} | |
| {"current_steps": 131, "total_steps": 400, "loss": 0.7486, "lr": 8.681980515339464e-08, "epoch": 32.872727272727275, "percentage": 32.75, "elapsed_time": "0:15:56", "remaining_time": "0:32:44"} | |
| {"current_steps": 132, "total_steps": 400, "loss": 0.7381, "lr": 8.65409168934933e-08, "epoch": 33.0, "percentage": 33.0, "elapsed_time": "0:16:00", "remaining_time": "0:32:29"} | |
| {"current_steps": 133, "total_steps": 400, "loss": 0.8277, "lr": 8.625962667065488e-08, "epoch": 33.29090909090909, "percentage": 33.25, "elapsed_time": "0:16:07", "remaining_time": "0:32:22"} | |
| {"current_steps": 134, "total_steps": 400, "loss": 0.7345, "lr": 8.597595590621892e-08, "epoch": 33.58181818181818, "percentage": 33.5, "elapsed_time": "0:16:14", "remaining_time": "0:32:15"} | |
| {"current_steps": 135, "total_steps": 400, "loss": 0.6949, "lr": 8.568992620281244e-08, "epoch": 33.872727272727275, "percentage": 33.75, "elapsed_time": "0:16:21", "remaining_time": "0:32:06"} | |
| {"current_steps": 136, "total_steps": 400, "loss": 0.6427, "lr": 8.540155934270471e-08, "epoch": 34.0, "percentage": 34.0, "elapsed_time": "0:16:24", "remaining_time": "0:31:50"} | |
| {"current_steps": 137, "total_steps": 400, "loss": 0.7113, "lr": 8.511087728614862e-08, "epoch": 34.29090909090909, "percentage": 34.25, "elapsed_time": "0:16:31", "remaining_time": "0:31:42"} | |
| {"current_steps": 138, "total_steps": 400, "loss": 0.7422, "lr": 8.481790216970819e-08, "epoch": 34.58181818181818, "percentage": 34.5, "elapsed_time": "0:16:37", "remaining_time": "0:31:34"} | |
| {"current_steps": 139, "total_steps": 400, "loss": 0.7829, "lr": 8.452265630457283e-08, "epoch": 34.872727272727275, "percentage": 34.75, "elapsed_time": "0:16:44", "remaining_time": "0:31:26"} | |
| {"current_steps": 140, "total_steps": 400, "loss": 0.718, "lr": 8.422516217485826e-08, "epoch": 35.0, "percentage": 35.0, "elapsed_time": "0:16:47", "remaining_time": "0:31:11"} | |
| {"current_steps": 141, "total_steps": 400, "loss": 0.7046, "lr": 8.392544243589427e-08, "epoch": 35.29090909090909, "percentage": 35.25, "elapsed_time": "0:16:55", "remaining_time": "0:31:05"} | |
| {"current_steps": 142, "total_steps": 400, "loss": 0.7685, "lr": 8.362351991249938e-08, "epoch": 35.58181818181818, "percentage": 35.5, "elapsed_time": "0:17:02", "remaining_time": "0:30:57"} | |
| {"current_steps": 143, "total_steps": 400, "loss": 0.6774, "lr": 8.331941759724268e-08, "epoch": 35.872727272727275, "percentage": 35.75, "elapsed_time": "0:17:08", "remaining_time": "0:30:49"} | |
| {"current_steps": 144, "total_steps": 400, "loss": 0.9019, "lr": 8.301315864869288e-08, "epoch": 36.0, "percentage": 36.0, "elapsed_time": "0:17:11", "remaining_time": "0:30:34"} | |
| {"current_steps": 144, "total_steps": 400, "eval_loss": 0.7050113677978516, "epoch": 36.0, "percentage": 36.0, "elapsed_time": "0:17:12", "remaining_time": "0:30:35"} | |
| {"current_steps": 145, "total_steps": 400, "loss": 0.7921, "lr": 8.270476638965461e-08, "epoch": 36.29090909090909, "percentage": 36.25, "elapsed_time": "0:17:43", "remaining_time": "0:31:10"} | |
| {"current_steps": 146, "total_steps": 400, "loss": 0.6827, "lr": 8.239426430539243e-08, "epoch": 36.58181818181818, "percentage": 36.5, "elapsed_time": "0:17:50", "remaining_time": "0:31:03"} | |
| {"current_steps": 147, "total_steps": 400, "loss": 0.7774, "lr": 8.208167604184218e-08, "epoch": 36.872727272727275, "percentage": 36.75, "elapsed_time": "0:17:57", "remaining_time": "0:30:55"} | |
| {"current_steps": 148, "total_steps": 400, "loss": 0.6709, "lr": 8.176702540381035e-08, "epoch": 37.0, "percentage": 37.0, "elapsed_time": "0:18:00", "remaining_time": "0:30:40"} | |
| {"current_steps": 149, "total_steps": 400, "loss": 0.7302, "lr": 8.145033635316129e-08, "epoch": 37.29090909090909, "percentage": 37.25, "elapsed_time": "0:18:07", "remaining_time": "0:30:32"} | |
| {"current_steps": 150, "total_steps": 400, "loss": 0.7301, "lr": 8.113163300699229e-08, "epoch": 37.58181818181818, "percentage": 37.5, "elapsed_time": "0:18:14", "remaining_time": "0:30:23"} | |
| {"current_steps": 151, "total_steps": 400, "loss": 0.7223, "lr": 8.081093963579708e-08, "epoch": 37.872727272727275, "percentage": 37.75, "elapsed_time": "0:18:22", "remaining_time": "0:30:17"} | |
| {"current_steps": 152, "total_steps": 400, "loss": 0.7989, "lr": 8.048828066161747e-08, "epoch": 38.0, "percentage": 38.0, "elapsed_time": "0:18:25", "remaining_time": "0:30:02"} | |
| {"current_steps": 153, "total_steps": 400, "loss": 0.6768, "lr": 8.016368065618359e-08, "epoch": 38.29090909090909, "percentage": 38.25, "elapsed_time": "0:18:31", "remaining_time": "0:29:55"} | |
| {"current_steps": 154, "total_steps": 400, "loss": 0.7454, "lr": 7.983716433904262e-08, "epoch": 38.58181818181818, "percentage": 38.5, "elapsed_time": "0:18:38", "remaining_time": "0:29:47"} | |
| {"current_steps": 155, "total_steps": 400, "loss": 0.7511, "lr": 7.950875657567622e-08, "epoch": 38.872727272727275, "percentage": 38.75, "elapsed_time": "0:18:46", "remaining_time": "0:29:40"} | |
| {"current_steps": 156, "total_steps": 400, "loss": 0.8113, "lr": 7.917848237560708e-08, "epoch": 39.0, "percentage": 39.0, "elapsed_time": "0:18:48", "remaining_time": "0:29:25"} | |
| {"current_steps": 157, "total_steps": 400, "loss": 0.7076, "lr": 7.884636689049422e-08, "epoch": 39.29090909090909, "percentage": 39.25, "elapsed_time": "0:18:55", "remaining_time": "0:29:17"} | |
| {"current_steps": 158, "total_steps": 400, "loss": 0.7437, "lr": 7.851243541221769e-08, "epoch": 39.58181818181818, "percentage": 39.5, "elapsed_time": "0:19:02", "remaining_time": "0:29:10"} | |
| {"current_steps": 159, "total_steps": 400, "loss": 0.7404, "lr": 7.817671337095244e-08, "epoch": 39.872727272727275, "percentage": 39.75, "elapsed_time": "0:19:09", "remaining_time": "0:29:02"} | |
| {"current_steps": 160, "total_steps": 400, "loss": 0.7328, "lr": 7.78392263332317e-08, "epoch": 40.0, "percentage": 40.0, "elapsed_time": "0:19:12", "remaining_time": "0:28:49"} | |
| {"current_steps": 160, "total_steps": 400, "eval_loss": 0.7006868124008179, "epoch": 40.0, "percentage": 40.0, "elapsed_time": "0:19:13", "remaining_time": "0:28:50"} | |
| {"current_steps": 161, "total_steps": 400, "loss": 0.7431, "lr": 7.75e-08, "epoch": 40.29090909090909, "percentage": 40.25, "elapsed_time": "0:19:42", "remaining_time": "0:29:16"} | |
| {"current_steps": 162, "total_steps": 400, "loss": 0.7585, "lr": 7.715906020465603e-08, "epoch": 40.58181818181818, "percentage": 40.5, "elapsed_time": "0:19:49", "remaining_time": "0:29:08"} | |
| {"current_steps": 163, "total_steps": 400, "loss": 0.7324, "lr": 7.681643291108518e-08, "epoch": 40.872727272727275, "percentage": 40.75, "elapsed_time": "0:19:56", "remaining_time": "0:28:59"} | |
| {"current_steps": 164, "total_steps": 400, "loss": 0.6533, "lr": 7.647214421168238e-08, "epoch": 41.0, "percentage": 41.0, "elapsed_time": "0:20:00", "remaining_time": "0:28:47"} | |
| {"current_steps": 165, "total_steps": 400, "loss": 0.7135, "lr": 7.612622032536508e-08, "epoch": 41.29090909090909, "percentage": 41.25, "elapsed_time": "0:20:07", "remaining_time": "0:28:39"} | |
| {"current_steps": 166, "total_steps": 400, "loss": 0.7597, "lr": 7.577868759557654e-08, "epoch": 41.58181818181818, "percentage": 41.5, "elapsed_time": "0:20:14", "remaining_time": "0:28:31"} | |
| {"current_steps": 167, "total_steps": 400, "loss": 0.7109, "lr": 7.54295724882796e-08, "epoch": 41.872727272727275, "percentage": 41.75, "elapsed_time": "0:20:20", "remaining_time": "0:28:23"} | |
| {"current_steps": 168, "total_steps": 400, "loss": 0.7504, "lr": 7.507890158994139e-08, "epoch": 42.0, "percentage": 42.0, "elapsed_time": "0:20:24", "remaining_time": "0:28:10"} | |
| {"current_steps": 169, "total_steps": 400, "loss": 0.7096, "lr": 7.472670160550848e-08, "epoch": 42.29090909090909, "percentage": 42.25, "elapsed_time": "0:20:31", "remaining_time": "0:28:03"} | |
| {"current_steps": 170, "total_steps": 400, "loss": 0.7692, "lr": 7.437299935637328e-08, "epoch": 42.58181818181818, "percentage": 42.5, "elapsed_time": "0:20:38", "remaining_time": "0:27:55"} | |
| {"current_steps": 171, "total_steps": 400, "loss": 0.7346, "lr": 7.401782177833146e-08, "epoch": 42.872727272727275, "percentage": 42.75, "elapsed_time": "0:20:44", "remaining_time": "0:27:47"} | |
| {"current_steps": 172, "total_steps": 400, "loss": 0.6633, "lr": 7.366119591953075e-08, "epoch": 43.0, "percentage": 43.0, "elapsed_time": "0:20:47", "remaining_time": "0:27:34"} | |
| {"current_steps": 173, "total_steps": 400, "loss": 0.7365, "lr": 7.3303148938411e-08, "epoch": 43.29090909090909, "percentage": 43.25, "elapsed_time": "0:20:55", "remaining_time": "0:27:27"} | |
| {"current_steps": 174, "total_steps": 400, "loss": 0.7511, "lr": 7.294370810163607e-08, "epoch": 43.58181818181818, "percentage": 43.5, "elapsed_time": "0:21:02", "remaining_time": "0:27:19"} | |
| {"current_steps": 175, "total_steps": 400, "loss": 0.6481, "lr": 7.258290078201731e-08, "epoch": 43.872727272727275, "percentage": 43.75, "elapsed_time": "0:21:08", "remaining_time": "0:27:11"} | |
| {"current_steps": 176, "total_steps": 400, "loss": 0.8191, "lr": 7.222075445642904e-08, "epoch": 44.0, "percentage": 44.0, "elapsed_time": "0:21:11", "remaining_time": "0:26:58"} | |
| {"current_steps": 176, "total_steps": 400, "eval_loss": 0.6937930583953857, "epoch": 44.0, "percentage": 44.0, "elapsed_time": "0:21:12", "remaining_time": "0:26:59"} | |
| {"current_steps": 177, "total_steps": 400, "loss": 0.7001, "lr": 7.185729670371604e-08, "epoch": 44.29090909090909, "percentage": 44.25, "elapsed_time": "0:21:42", "remaining_time": "0:27:21"} | |
| {"current_steps": 178, "total_steps": 400, "loss": 0.786, "lr": 7.149255520259337e-08, "epoch": 44.58181818181818, "percentage": 44.5, "elapsed_time": "0:21:49", "remaining_time": "0:27:13"} | |
| {"current_steps": 179, "total_steps": 400, "loss": 0.6767, "lr": 7.11265577295385e-08, "epoch": 44.872727272727275, "percentage": 44.75, "elapsed_time": "0:21:56", "remaining_time": "0:27:05"} | |
| {"current_steps": 180, "total_steps": 400, "loss": 0.7351, "lr": 7.075933215667603e-08, "epoch": 45.0, "percentage": 45.0, "elapsed_time": "0:21:59", "remaining_time": "0:26:52"} | |
| {"current_steps": 181, "total_steps": 400, "loss": 0.7047, "lr": 7.039090644965509e-08, "epoch": 45.29090909090909, "percentage": 45.25, "elapsed_time": "0:22:06", "remaining_time": "0:26:45"} | |
| {"current_steps": 182, "total_steps": 400, "loss": 0.7113, "lr": 7.002130866551968e-08, "epoch": 45.58181818181818, "percentage": 45.5, "elapsed_time": "0:22:13", "remaining_time": "0:26:37"} | |
| {"current_steps": 183, "total_steps": 400, "loss": 0.7255, "lr": 6.965056695057204e-08, "epoch": 45.872727272727275, "percentage": 45.75, "elapsed_time": "0:22:20", "remaining_time": "0:26:30"} | |
| {"current_steps": 184, "total_steps": 400, "loss": 0.7503, "lr": 6.927870953822915e-08, "epoch": 46.0, "percentage": 46.0, "elapsed_time": "0:22:23", "remaining_time": "0:26:17"} | |
| {"current_steps": 185, "total_steps": 400, "loss": 0.7008, "lr": 6.890576474687262e-08, "epoch": 46.29090909090909, "percentage": 46.25, "elapsed_time": "0:22:30", "remaining_time": "0:26:09"} | |
| {"current_steps": 186, "total_steps": 400, "loss": 0.6925, "lr": 6.853176097769228e-08, "epoch": 46.58181818181818, "percentage": 46.5, "elapsed_time": "0:22:37", "remaining_time": "0:26:01"} | |
| {"current_steps": 187, "total_steps": 400, "loss": 0.7409, "lr": 6.815672671252315e-08, "epoch": 46.872727272727275, "percentage": 46.75, "elapsed_time": "0:22:44", "remaining_time": "0:25:54"} | |
| {"current_steps": 188, "total_steps": 400, "loss": 0.702, "lr": 6.778069051167653e-08, "epoch": 47.0, "percentage": 47.0, "elapsed_time": "0:22:47", "remaining_time": "0:25:42"} | |
| {"current_steps": 189, "total_steps": 400, "loss": 0.7085, "lr": 6.740368101176495e-08, "epoch": 47.29090909090909, "percentage": 47.25, "elapsed_time": "0:22:54", "remaining_time": "0:25:34"} | |
| {"current_steps": 190, "total_steps": 400, "loss": 0.685, "lr": 6.702572692352155e-08, "epoch": 47.58181818181818, "percentage": 47.5, "elapsed_time": "0:23:01", "remaining_time": "0:25:27"} | |
| {"current_steps": 191, "total_steps": 400, "loss": 0.7551, "lr": 6.664685702961344e-08, "epoch": 47.872727272727275, "percentage": 47.75, "elapsed_time": "0:23:08", "remaining_time": "0:25:19"} | |
| {"current_steps": 192, "total_steps": 400, "loss": 0.6327, "lr": 6.626710018244986e-08, "epoch": 48.0, "percentage": 48.0, "elapsed_time": "0:23:11", "remaining_time": "0:25:07"} | |
| {"current_steps": 192, "total_steps": 400, "eval_loss": 0.6752312183380127, "epoch": 48.0, "percentage": 48.0, "elapsed_time": "0:23:12", "remaining_time": "0:25:08"} | |
| {"current_steps": 193, "total_steps": 400, "loss": 0.7312, "lr": 6.588648530198504e-08, "epoch": 48.29090909090909, "percentage": 48.25, "elapsed_time": "0:23:37", "remaining_time": "0:25:19"} | |
| {"current_steps": 194, "total_steps": 400, "loss": 0.7467, "lr": 6.550504137351574e-08, "epoch": 48.58181818181818, "percentage": 48.5, "elapsed_time": "0:23:44", "remaining_time": "0:25:12"} | |
| {"current_steps": 195, "total_steps": 400, "loss": 0.6271, "lr": 6.512279744547392e-08, "epoch": 48.872727272727275, "percentage": 48.75, "elapsed_time": "0:23:51", "remaining_time": "0:25:04"} | |
| {"current_steps": 196, "total_steps": 400, "loss": 0.7127, "lr": 6.473978262721462e-08, "epoch": 49.0, "percentage": 49.0, "elapsed_time": "0:23:53", "remaining_time": "0:24:52"} | |
| {"current_steps": 197, "total_steps": 400, "loss": 0.7255, "lr": 6.435602608679917e-08, "epoch": 49.29090909090909, "percentage": 49.25, "elapsed_time": "0:24:00", "remaining_time": "0:24:44"} | |
| {"current_steps": 198, "total_steps": 400, "loss": 0.6177, "lr": 6.397155704877387e-08, "epoch": 49.58181818181818, "percentage": 49.5, "elapsed_time": "0:24:07", "remaining_time": "0:24:36"} | |
| {"current_steps": 199, "total_steps": 400, "loss": 0.7295, "lr": 6.358640479194451e-08, "epoch": 49.872727272727275, "percentage": 49.75, "elapsed_time": "0:24:14", "remaining_time": "0:24:28"} | |
| {"current_steps": 200, "total_steps": 400, "loss": 0.7091, "lr": 6.320059864714664e-08, "epoch": 50.0, "percentage": 50.0, "elapsed_time": "0:24:17", "remaining_time": "0:24:17"} | |
| {"current_steps": 201, "total_steps": 400, "loss": 0.7432, "lr": 6.281416799501187e-08, "epoch": 50.29090909090909, "percentage": 50.25, "elapsed_time": "0:24:24", "remaining_time": "0:24:09"} | |
| {"current_steps": 202, "total_steps": 400, "loss": 0.676, "lr": 6.242714226373049e-08, "epoch": 50.58181818181818, "percentage": 50.5, "elapsed_time": "0:24:30", "remaining_time": "0:24:01"} | |
| {"current_steps": 203, "total_steps": 400, "loss": 0.7086, "lr": 6.203955092681039e-08, "epoch": 50.872727272727275, "percentage": 50.75, "elapsed_time": "0:24:37", "remaining_time": "0:23:53"} | |
| {"current_steps": 204, "total_steps": 400, "loss": 0.5264, "lr": 6.165142350083249e-08, "epoch": 51.0, "percentage": 51.0, "elapsed_time": "0:24:40", "remaining_time": "0:23:42"} | |
| {"current_steps": 205, "total_steps": 400, "loss": 0.7346, "lr": 6.126278954320294e-08, "epoch": 51.29090909090909, "percentage": 51.25, "elapsed_time": "0:24:47", "remaining_time": "0:23:34"} | |
| {"current_steps": 206, "total_steps": 400, "loss": 0.6239, "lr": 6.087367864990232e-08, "epoch": 51.58181818181818, "percentage": 51.5, "elapsed_time": "0:24:53", "remaining_time": "0:23:26"} | |
| {"current_steps": 207, "total_steps": 400, "loss": 0.688, "lr": 6.048412045323163e-08, "epoch": 51.872727272727275, "percentage": 51.75, "elapsed_time": "0:25:00", "remaining_time": "0:23:19"} | |
| {"current_steps": 208, "total_steps": 400, "loss": 0.6903, "lr": 6.00941446195558e-08, "epoch": 52.0, "percentage": 52.0, "elapsed_time": "0:25:03", "remaining_time": "0:23:08"} | |
| {"current_steps": 208, "total_steps": 400, "eval_loss": 0.6604220271110535, "epoch": 52.0, "percentage": 52.0, "elapsed_time": "0:25:04", "remaining_time": "0:23:08"} | |
| {"current_steps": 209, "total_steps": 400, "loss": 0.6428, "lr": 5.970378084704441e-08, "epoch": 52.29090909090909, "percentage": 52.25, "elapsed_time": "0:25:34", "remaining_time": "0:23:22"} | |
| {"current_steps": 210, "total_steps": 400, "loss": 0.7572, "lr": 5.931305886341008e-08, "epoch": 52.58181818181818, "percentage": 52.5, "elapsed_time": "0:25:41", "remaining_time": "0:23:14"} | |
| {"current_steps": 211, "total_steps": 400, "loss": 0.6545, "lr": 5.892200842364462e-08, "epoch": 52.872727272727275, "percentage": 52.75, "elapsed_time": "0:25:48", "remaining_time": "0:23:07"} | |
| {"current_steps": 212, "total_steps": 400, "loss": 0.6439, "lr": 5.853065930775303e-08, "epoch": 53.0, "percentage": 53.0, "elapsed_time": "0:25:51", "remaining_time": "0:22:55"} | |
| {"current_steps": 213, "total_steps": 400, "loss": 0.677, "lr": 5.813904131848564e-08, "epoch": 53.29090909090909, "percentage": 53.25, "elapsed_time": "0:25:58", "remaining_time": "0:22:48"} | |
| {"current_steps": 214, "total_steps": 400, "loss": 0.6321, "lr": 5.7747184279068564e-08, "epoch": 53.58181818181818, "percentage": 53.5, "elapsed_time": "0:26:05", "remaining_time": "0:22:40"} | |
| {"current_steps": 215, "total_steps": 400, "loss": 0.7326, "lr": 5.735511803093248e-08, "epoch": 53.872727272727275, "percentage": 53.75, "elapsed_time": "0:26:12", "remaining_time": "0:22:32"} | |
| {"current_steps": 216, "total_steps": 400, "loss": 0.6819, "lr": 5.696287243144012e-08, "epoch": 54.0, "percentage": 54.0, "elapsed_time": "0:26:15", "remaining_time": "0:22:21"} | |
| {"current_steps": 217, "total_steps": 400, "loss": 0.6655, "lr": 5.6570477351612554e-08, "epoch": 54.29090909090909, "percentage": 54.25, "elapsed_time": "0:26:22", "remaining_time": "0:22:14"} | |
| {"current_steps": 218, "total_steps": 400, "loss": 0.6743, "lr": 5.61779626738543e-08, "epoch": 54.58181818181818, "percentage": 54.5, "elapsed_time": "0:26:29", "remaining_time": "0:22:06"} | |
| {"current_steps": 219, "total_steps": 400, "loss": 0.711, "lr": 5.5785358289677765e-08, "epoch": 54.872727272727275, "percentage": 54.75, "elapsed_time": "0:26:35", "remaining_time": "0:21:58"} | |
| {"current_steps": 220, "total_steps": 400, "loss": 0.6398, "lr": 5.539269409742683e-08, "epoch": 55.0, "percentage": 55.0, "elapsed_time": "0:26:39", "remaining_time": "0:21:48"} | |
| {"current_steps": 221, "total_steps": 400, "loss": 0.6885, "lr": 5.5e-08, "epoch": 55.29090909090909, "percentage": 55.25, "elapsed_time": "0:26:45", "remaining_time": "0:21:40"} | |
| {"current_steps": 222, "total_steps": 400, "loss": 0.6391, "lr": 5.460730590257318e-08, "epoch": 55.58181818181818, "percentage": 55.5, "elapsed_time": "0:26:52", "remaining_time": "0:21:32"} | |
| {"current_steps": 223, "total_steps": 400, "loss": 0.6684, "lr": 5.421464171032224e-08, "epoch": 55.872727272727275, "percentage": 55.75, "elapsed_time": "0:27:00", "remaining_time": "0:21:25"} | |
| {"current_steps": 224, "total_steps": 400, "loss": 0.7467, "lr": 5.382203732614572e-08, "epoch": 56.0, "percentage": 56.0, "elapsed_time": "0:27:02", "remaining_time": "0:21:15"} | |
| {"current_steps": 224, "total_steps": 400, "eval_loss": 0.6532977819442749, "epoch": 56.0, "percentage": 56.0, "elapsed_time": "0:27:03", "remaining_time": "0:21:15"} | |
| {"current_steps": 225, "total_steps": 400, "loss": 0.7395, "lr": 5.342952264838747e-08, "epoch": 56.29090909090909, "percentage": 56.25, "elapsed_time": "0:27:35", "remaining_time": "0:21:27"} | |
| {"current_steps": 226, "total_steps": 400, "loss": 0.7176, "lr": 5.303712756855988e-08, "epoch": 56.58181818181818, "percentage": 56.5, "elapsed_time": "0:27:42", "remaining_time": "0:21:19"} | |
| {"current_steps": 227, "total_steps": 400, "loss": 0.5565, "lr": 5.264488196906752e-08, "epoch": 56.872727272727275, "percentage": 56.75, "elapsed_time": "0:27:49", "remaining_time": "0:21:12"} | |
| {"current_steps": 228, "total_steps": 400, "loss": 0.7052, "lr": 5.225281572093143e-08, "epoch": 57.0, "percentage": 57.0, "elapsed_time": "0:27:52", "remaining_time": "0:21:01"} | |
| {"current_steps": 229, "total_steps": 400, "loss": 0.6931, "lr": 5.1860958681514355e-08, "epoch": 57.29090909090909, "percentage": 57.25, "elapsed_time": "0:27:59", "remaining_time": "0:20:53"} | |
| {"current_steps": 230, "total_steps": 400, "loss": 0.6126, "lr": 5.1469340692246985e-08, "epoch": 57.58181818181818, "percentage": 57.5, "elapsed_time": "0:28:06", "remaining_time": "0:20:46"} | |
| {"current_steps": 231, "total_steps": 400, "loss": 0.7149, "lr": 5.107799157635537e-08, "epoch": 57.872727272727275, "percentage": 57.75, "elapsed_time": "0:28:12", "remaining_time": "0:20:38"} | |
| {"current_steps": 232, "total_steps": 400, "loss": 0.6564, "lr": 5.068694113658992e-08, "epoch": 58.0, "percentage": 58.0, "elapsed_time": "0:28:16", "remaining_time": "0:20:28"} | |
| {"current_steps": 233, "total_steps": 400, "loss": 0.6657, "lr": 5.02962191529556e-08, "epoch": 58.29090909090909, "percentage": 58.25, "elapsed_time": "0:28:22", "remaining_time": "0:20:20"} | |
| {"current_steps": 234, "total_steps": 400, "loss": 0.7461, "lr": 4.9905855380444194e-08, "epoch": 58.58181818181818, "percentage": 58.5, "elapsed_time": "0:28:29", "remaining_time": "0:20:13"} | |
| {"current_steps": 235, "total_steps": 400, "loss": 0.5924, "lr": 4.9515879546768366e-08, "epoch": 58.872727272727275, "percentage": 58.75, "elapsed_time": "0:28:36", "remaining_time": "0:20:05"} | |
| {"current_steps": 236, "total_steps": 400, "loss": 0.6793, "lr": 4.912632135009769e-08, "epoch": 59.0, "percentage": 59.0, "elapsed_time": "0:28:39", "remaining_time": "0:19:55"} | |
| {"current_steps": 237, "total_steps": 400, "loss": 0.6648, "lr": 4.873721045679706e-08, "epoch": 59.29090909090909, "percentage": 59.25, "elapsed_time": "0:28:46", "remaining_time": "0:19:47"} | |
| {"current_steps": 238, "total_steps": 400, "loss": 0.6871, "lr": 4.8348576499167516e-08, "epoch": 59.58181818181818, "percentage": 59.5, "elapsed_time": "0:28:54", "remaining_time": "0:19:40"} | |
| {"current_steps": 239, "total_steps": 400, "loss": 0.6136, "lr": 4.7960449073189604e-08, "epoch": 59.872727272727275, "percentage": 59.75, "elapsed_time": "0:29:00", "remaining_time": "0:19:32"} | |
| {"current_steps": 240, "total_steps": 400, "loss": 0.7364, "lr": 4.75728577362695e-08, "epoch": 60.0, "percentage": 60.0, "elapsed_time": "0:29:03", "remaining_time": "0:19:22"} | |
| {"current_steps": 240, "total_steps": 400, "eval_loss": 0.6488688588142395, "epoch": 60.0, "percentage": 60.0, "elapsed_time": "0:29:04", "remaining_time": "0:19:22"} | |
| {"current_steps": 241, "total_steps": 400, "loss": 0.7386, "lr": 4.718583200498813e-08, "epoch": 60.29090909090909, "percentage": 60.25, "elapsed_time": "0:29:30", "remaining_time": "0:19:28"} | |
| {"current_steps": 242, "total_steps": 400, "loss": 0.6255, "lr": 4.6799401352853365e-08, "epoch": 60.58181818181818, "percentage": 60.5, "elapsed_time": "0:29:37", "remaining_time": "0:19:20"} | |
| {"current_steps": 243, "total_steps": 400, "loss": 0.6834, "lr": 4.641359520805548e-08, "epoch": 60.872727272727275, "percentage": 60.75, "elapsed_time": "0:29:43", "remaining_time": "0:19:12"} | |
| {"current_steps": 244, "total_steps": 400, "loss": 0.5903, "lr": 4.6028442951226135e-08, "epoch": 61.0, "percentage": 61.0, "elapsed_time": "0:29:47", "remaining_time": "0:19:02"} | |
| {"current_steps": 245, "total_steps": 400, "loss": 0.5871, "lr": 4.564397391320084e-08, "epoch": 61.29090909090909, "percentage": 61.25, "elapsed_time": "0:29:54", "remaining_time": "0:18:54"} | |
| {"current_steps": 246, "total_steps": 400, "loss": 0.6913, "lr": 4.526021737278537e-08, "epoch": 61.58181818181818, "percentage": 61.5, "elapsed_time": "0:30:00", "remaining_time": "0:18:47"} | |
| {"current_steps": 247, "total_steps": 400, "loss": 0.7115, "lr": 4.4877202554526084e-08, "epoch": 61.872727272727275, "percentage": 61.75, "elapsed_time": "0:30:07", "remaining_time": "0:18:39"} | |
| {"current_steps": 248, "total_steps": 400, "loss": 0.687, "lr": 4.449495862648427e-08, "epoch": 62.0, "percentage": 62.0, "elapsed_time": "0:30:10", "remaining_time": "0:18:29"} | |
| {"current_steps": 249, "total_steps": 400, "loss": 0.6901, "lr": 4.4113514698014955e-08, "epoch": 62.29090909090909, "percentage": 62.25, "elapsed_time": "0:30:17", "remaining_time": "0:18:22"} | |
| {"current_steps": 250, "total_steps": 400, "loss": 0.631, "lr": 4.373289981755013e-08, "epoch": 62.58181818181818, "percentage": 62.5, "elapsed_time": "0:30:24", "remaining_time": "0:18:14"} | |
| {"current_steps": 251, "total_steps": 400, "loss": 0.6351, "lr": 4.335314297038656e-08, "epoch": 62.872727272727275, "percentage": 62.75, "elapsed_time": "0:30:30", "remaining_time": "0:18:06"} | |
| {"current_steps": 252, "total_steps": 400, "loss": 0.7212, "lr": 4.297427307647844e-08, "epoch": 63.0, "percentage": 63.0, "elapsed_time": "0:30:33", "remaining_time": "0:17:56"} | |
| {"current_steps": 253, "total_steps": 400, "loss": 0.629, "lr": 4.2596318988235035e-08, "epoch": 63.29090909090909, "percentage": 63.25, "elapsed_time": "0:30:40", "remaining_time": "0:17:49"} | |
| {"current_steps": 254, "total_steps": 400, "loss": 0.6565, "lr": 4.2219309488323486e-08, "epoch": 63.58181818181818, "percentage": 63.5, "elapsed_time": "0:30:47", "remaining_time": "0:17:41"} | |
| {"current_steps": 255, "total_steps": 400, "loss": 0.6644, "lr": 4.184327328747685e-08, "epoch": 63.872727272727275, "percentage": 63.75, "elapsed_time": "0:30:54", "remaining_time": "0:17:34"} | |
| {"current_steps": 256, "total_steps": 400, "loss": 0.7706, "lr": 4.1468239022307716e-08, "epoch": 64.0, "percentage": 64.0, "elapsed_time": "0:30:56", "remaining_time": "0:17:24"} | |
| {"current_steps": 256, "total_steps": 400, "eval_loss": 0.6460027694702148, "epoch": 64.0, "percentage": 64.0, "elapsed_time": "0:30:57", "remaining_time": "0:17:24"} | |
| {"current_steps": 257, "total_steps": 400, "loss": 0.5848, "lr": 4.1094235253127375e-08, "epoch": 64.2909090909091, "percentage": 64.25, "elapsed_time": "0:31:28", "remaining_time": "0:17:30"} | |
| {"current_steps": 258, "total_steps": 400, "loss": 0.6438, "lr": 4.072129046177086e-08, "epoch": 64.58181818181818, "percentage": 64.5, "elapsed_time": "0:31:34", "remaining_time": "0:17:22"} | |
| {"current_steps": 259, "total_steps": 400, "loss": 0.7825, "lr": 4.034943304942796e-08, "epoch": 64.87272727272727, "percentage": 64.75, "elapsed_time": "0:31:41", "remaining_time": "0:17:15"} | |
| {"current_steps": 260, "total_steps": 400, "loss": 0.7003, "lr": 3.997869133448031e-08, "epoch": 65.0, "percentage": 65.0, "elapsed_time": "0:31:44", "remaining_time": "0:17:05"} | |
| {"current_steps": 261, "total_steps": 400, "loss": 0.6723, "lr": 3.960909355034491e-08, "epoch": 65.2909090909091, "percentage": 65.25, "elapsed_time": "0:31:51", "remaining_time": "0:16:58"} | |
| {"current_steps": 262, "total_steps": 400, "loss": 0.6778, "lr": 3.924066784332396e-08, "epoch": 65.58181818181818, "percentage": 65.5, "elapsed_time": "0:31:58", "remaining_time": "0:16:50"} | |
| {"current_steps": 263, "total_steps": 400, "loss": 0.6196, "lr": 3.8873442270461487e-08, "epoch": 65.87272727272727, "percentage": 65.75, "elapsed_time": "0:32:05", "remaining_time": "0:16:43"} | |
| {"current_steps": 264, "total_steps": 400, "loss": 0.7125, "lr": 3.850744479740663e-08, "epoch": 66.0, "percentage": 66.0, "elapsed_time": "0:32:08", "remaining_time": "0:16:33"} | |
| {"current_steps": 265, "total_steps": 400, "loss": 0.6958, "lr": 3.814270329628395e-08, "epoch": 66.2909090909091, "percentage": 66.25, "elapsed_time": "0:32:15", "remaining_time": "0:16:26"} | |
| {"current_steps": 266, "total_steps": 400, "loss": 0.6089, "lr": 3.777924554357096e-08, "epoch": 66.58181818181818, "percentage": 66.5, "elapsed_time": "0:32:22", "remaining_time": "0:16:18"} | |
| {"current_steps": 267, "total_steps": 400, "loss": 0.6794, "lr": 3.7417099217982684e-08, "epoch": 66.87272727272727, "percentage": 66.75, "elapsed_time": "0:32:29", "remaining_time": "0:16:11"} | |
| {"current_steps": 268, "total_steps": 400, "loss": 0.6845, "lr": 3.7056291898363926e-08, "epoch": 67.0, "percentage": 67.0, "elapsed_time": "0:32:32", "remaining_time": "0:16:01"} | |
| {"current_steps": 269, "total_steps": 400, "loss": 0.6726, "lr": 3.669685106158899e-08, "epoch": 67.2909090909091, "percentage": 67.25, "elapsed_time": "0:32:39", "remaining_time": "0:15:54"} | |
| {"current_steps": 270, "total_steps": 400, "loss": 0.6597, "lr": 3.633880408046926e-08, "epoch": 67.58181818181818, "percentage": 67.5, "elapsed_time": "0:32:45", "remaining_time": "0:15:46"} | |
| {"current_steps": 271, "total_steps": 400, "loss": 0.5967, "lr": 3.598217822166854e-08, "epoch": 67.87272727272727, "percentage": 67.75, "elapsed_time": "0:32:53", "remaining_time": "0:15:39"} | |
| {"current_steps": 272, "total_steps": 400, "loss": 0.7777, "lr": 3.5627000643626705e-08, "epoch": 68.0, "percentage": 68.0, "elapsed_time": "0:32:56", "remaining_time": "0:15:30"} | |
| {"current_steps": 272, "total_steps": 400, "eval_loss": 0.6440867185592651, "epoch": 68.0, "percentage": 68.0, "elapsed_time": "0:32:57", "remaining_time": "0:15:30"} | |
| {"current_steps": 273, "total_steps": 400, "loss": 0.6824, "lr": 3.527329839449151e-08, "epoch": 68.2909090909091, "percentage": 68.25, "elapsed_time": "0:33:28", "remaining_time": "0:15:34"} | |
| {"current_steps": 274, "total_steps": 400, "loss": 0.5956, "lr": 3.49210984100586e-08, "epoch": 68.58181818181818, "percentage": 68.5, "elapsed_time": "0:33:35", "remaining_time": "0:15:27"} | |
| {"current_steps": 275, "total_steps": 400, "loss": 0.679, "lr": 3.4570427511720395e-08, "epoch": 68.87272727272727, "percentage": 68.75, "elapsed_time": "0:33:43", "remaining_time": "0:15:19"} | |
| {"current_steps": 276, "total_steps": 400, "loss": 0.7194, "lr": 3.4221312404423483e-08, "epoch": 69.0, "percentage": 69.0, "elapsed_time": "0:33:46", "remaining_time": "0:15:10"} | |
| {"current_steps": 277, "total_steps": 400, "loss": 0.5994, "lr": 3.387377967463493e-08, "epoch": 69.2909090909091, "percentage": 69.25, "elapsed_time": "0:33:53", "remaining_time": "0:15:02"} | |
| {"current_steps": 278, "total_steps": 400, "loss": 0.6582, "lr": 3.3527855788317614e-08, "epoch": 69.58181818181818, "percentage": 69.5, "elapsed_time": "0:34:00", "remaining_time": "0:14:55"} | |
| {"current_steps": 279, "total_steps": 400, "loss": 0.7129, "lr": 3.3183567088914834e-08, "epoch": 69.87272727272727, "percentage": 69.75, "elapsed_time": "0:34:07", "remaining_time": "0:14:47"} | |
| {"current_steps": 280, "total_steps": 400, "loss": 0.7197, "lr": 3.2840939795343986e-08, "epoch": 70.0, "percentage": 70.0, "elapsed_time": "0:34:10", "remaining_time": "0:14:38"} | |
| {"current_steps": 281, "total_steps": 400, "loss": 0.6844, "lr": 3.250000000000001e-08, "epoch": 70.2909090909091, "percentage": 70.25, "elapsed_time": "0:34:16", "remaining_time": "0:14:31"} | |
| {"current_steps": 282, "total_steps": 400, "loss": 0.7062, "lr": 3.2160773666768325e-08, "epoch": 70.58181818181818, "percentage": 70.5, "elapsed_time": "0:34:23", "remaining_time": "0:14:23"} | |
| {"current_steps": 283, "total_steps": 400, "loss": 0.597, "lr": 3.182328662904756e-08, "epoch": 70.87272727272727, "percentage": 70.75, "elapsed_time": "0:34:30", "remaining_time": "0:14:16"} | |
| {"current_steps": 284, "total_steps": 400, "loss": 0.6592, "lr": 3.14875645877823e-08, "epoch": 71.0, "percentage": 71.0, "elapsed_time": "0:34:33", "remaining_time": "0:14:07"} | |
| {"current_steps": 285, "total_steps": 400, "loss": 0.6398, "lr": 3.1153633109505784e-08, "epoch": 71.2909090909091, "percentage": 71.25, "elapsed_time": "0:34:40", "remaining_time": "0:13:59"} | |
| {"current_steps": 286, "total_steps": 400, "loss": 0.6979, "lr": 3.082151762439292e-08, "epoch": 71.58181818181818, "percentage": 71.5, "elapsed_time": "0:34:47", "remaining_time": "0:13:52"} | |
| {"current_steps": 287, "total_steps": 400, "loss": 0.6352, "lr": 3.049124342432378e-08, "epoch": 71.87272727272727, "percentage": 71.75, "elapsed_time": "0:34:54", "remaining_time": "0:13:44"} | |
| {"current_steps": 288, "total_steps": 400, "loss": 0.6391, "lr": 3.0162835660957385e-08, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:57", "remaining_time": "0:13:35"} | |
| {"current_steps": 288, "total_steps": 400, "eval_loss": 0.641921877861023, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:58", "remaining_time": "0:13:36"} | |
| {"current_steps": 289, "total_steps": 400, "loss": 0.6219, "lr": 2.983631934381639e-08, "epoch": 72.2909090909091, "percentage": 72.25, "elapsed_time": "0:35:28", "remaining_time": "0:13:37"} | |
| {"current_steps": 290, "total_steps": 400, "loss": 0.6635, "lr": 2.9511719338382535e-08, "epoch": 72.58181818181818, "percentage": 72.5, "elapsed_time": "0:35:35", "remaining_time": "0:13:30"} | |
| {"current_steps": 291, "total_steps": 400, "loss": 0.6377, "lr": 2.918906036420294e-08, "epoch": 72.87272727272727, "percentage": 72.75, "elapsed_time": "0:35:42", "remaining_time": "0:13:22"} | |
| {"current_steps": 292, "total_steps": 400, "loss": 0.7822, "lr": 2.886836699300771e-08, "epoch": 73.0, "percentage": 73.0, "elapsed_time": "0:35:45", "remaining_time": "0:13:13"} | |
| {"current_steps": 293, "total_steps": 400, "loss": 0.609, "lr": 2.8549663646838718e-08, "epoch": 73.2909090909091, "percentage": 73.25, "elapsed_time": "0:35:52", "remaining_time": "0:13:06"} | |
| {"current_steps": 294, "total_steps": 400, "loss": 0.6728, "lr": 2.8232974596189653e-08, "epoch": 73.58181818181818, "percentage": 73.5, "elapsed_time": "0:35:59", "remaining_time": "0:12:58"} | |
| {"current_steps": 295, "total_steps": 400, "loss": 0.7013, "lr": 2.791832395815782e-08, "epoch": 73.87272727272727, "percentage": 73.75, "elapsed_time": "0:36:06", "remaining_time": "0:12:51"} | |
| {"current_steps": 296, "total_steps": 400, "loss": 0.6343, "lr": 2.760573569460757e-08, "epoch": 74.0, "percentage": 74.0, "elapsed_time": "0:36:09", "remaining_time": "0:12:42"} | |
| {"current_steps": 297, "total_steps": 400, "loss": 0.6528, "lr": 2.729523361034538e-08, "epoch": 74.2909090909091, "percentage": 74.25, "elapsed_time": "0:36:16", "remaining_time": "0:12:34"} | |
| {"current_steps": 298, "total_steps": 400, "loss": 0.6243, "lr": 2.6986841351307128e-08, "epoch": 74.58181818181818, "percentage": 74.5, "elapsed_time": "0:36:23", "remaining_time": "0:12:27"} | |
| {"current_steps": 299, "total_steps": 400, "loss": 0.6658, "lr": 2.6680582402757322e-08, "epoch": 74.87272727272727, "percentage": 74.75, "elapsed_time": "0:36:30", "remaining_time": "0:12:20"} | |
| {"current_steps": 300, "total_steps": 400, "loss": 0.7016, "lr": 2.637648008750062e-08, "epoch": 75.0, "percentage": 75.0, "elapsed_time": "0:36:33", "remaining_time": "0:12:11"} | |
| {"current_steps": 301, "total_steps": 400, "loss": 0.6661, "lr": 2.6074557564105726e-08, "epoch": 75.2909090909091, "percentage": 75.25, "elapsed_time": "0:36:40", "remaining_time": "0:12:03"} | |
| {"current_steps": 302, "total_steps": 400, "loss": 0.6277, "lr": 2.5774837825141737e-08, "epoch": 75.58181818181818, "percentage": 75.5, "elapsed_time": "0:36:48", "remaining_time": "0:11:56"} | |
| {"current_steps": 303, "total_steps": 400, "loss": 0.6863, "lr": 2.547734369542718e-08, "epoch": 75.87272727272727, "percentage": 75.75, "elapsed_time": "0:36:54", "remaining_time": "0:11:49"} | |
| {"current_steps": 304, "total_steps": 400, "loss": 0.648, "lr": 2.5182097830291825e-08, "epoch": 76.0, "percentage": 76.0, "elapsed_time": "0:36:58", "remaining_time": "0:11:40"} | |
| {"current_steps": 304, "total_steps": 400, "eval_loss": 0.6407743096351624, "epoch": 76.0, "percentage": 76.0, "elapsed_time": "0:36:58", "remaining_time": "0:11:40"} | |
| {"current_steps": 305, "total_steps": 400, "loss": 0.6552, "lr": 2.4889122713851394e-08, "epoch": 76.2909090909091, "percentage": 76.25, "elapsed_time": "0:37:24", "remaining_time": "0:11:38"} | |
| {"current_steps": 306, "total_steps": 400, "loss": 0.6147, "lr": 2.4598440657295288e-08, "epoch": 76.58181818181818, "percentage": 76.5, "elapsed_time": "0:37:30", "remaining_time": "0:11:31"} | |
| {"current_steps": 307, "total_steps": 400, "loss": 0.7181, "lr": 2.4310073797187574e-08, "epoch": 76.87272727272727, "percentage": 76.75, "elapsed_time": "0:37:37", "remaining_time": "0:11:23"} | |
| {"current_steps": 308, "total_steps": 400, "loss": 0.6115, "lr": 2.4024044093781064e-08, "epoch": 77.0, "percentage": 77.0, "elapsed_time": "0:37:40", "remaining_time": "0:11:15"} | |
| {"current_steps": 309, "total_steps": 400, "loss": 0.7065, "lr": 2.3740373329345117e-08, "epoch": 77.2909090909091, "percentage": 77.25, "elapsed_time": "0:37:47", "remaining_time": "0:11:07"} | |
| {"current_steps": 310, "total_steps": 400, "loss": 0.6265, "lr": 2.3459083106506712e-08, "epoch": 77.58181818181818, "percentage": 77.5, "elapsed_time": "0:37:54", "remaining_time": "0:11:00"} | |
| {"current_steps": 311, "total_steps": 400, "loss": 0.629, "lr": 2.3180194846605363e-08, "epoch": 77.87272727272727, "percentage": 77.75, "elapsed_time": "0:38:01", "remaining_time": "0:10:52"} | |
| {"current_steps": 312, "total_steps": 400, "loss": 0.6626, "lr": 2.2903729788061836e-08, "epoch": 78.0, "percentage": 78.0, "elapsed_time": "0:38:04", "remaining_time": "0:10:44"} | |
| {"current_steps": 313, "total_steps": 400, "loss": 0.7006, "lr": 2.2629708984760707e-08, "epoch": 78.2909090909091, "percentage": 78.25, "elapsed_time": "0:38:11", "remaining_time": "0:10:36"} | |
| {"current_steps": 314, "total_steps": 400, "loss": 0.6363, "lr": 2.2358153304447067e-08, "epoch": 78.58181818181818, "percentage": 78.5, "elapsed_time": "0:38:18", "remaining_time": "0:10:29"} | |
| {"current_steps": 315, "total_steps": 400, "loss": 0.6307, "lr": 2.2089083427137328e-08, "epoch": 78.87272727272727, "percentage": 78.75, "elapsed_time": "0:38:24", "remaining_time": "0:10:21"} | |
| {"current_steps": 316, "total_steps": 400, "loss": 0.6594, "lr": 2.182251984354442e-08, "epoch": 79.0, "percentage": 79.0, "elapsed_time": "0:38:27", "remaining_time": "0:10:13"} | |
| {"current_steps": 317, "total_steps": 400, "loss": 0.6261, "lr": 2.1558482853517254e-08, "epoch": 79.2909090909091, "percentage": 79.25, "elapsed_time": "0:38:34", "remaining_time": "0:10:06"} | |
| {"current_steps": 318, "total_steps": 400, "loss": 0.6303, "lr": 2.1296992564494903e-08, "epoch": 79.58181818181818, "percentage": 79.5, "elapsed_time": "0:38:41", "remaining_time": "0:09:58"} | |
| {"current_steps": 319, "total_steps": 400, "loss": 0.6847, "lr": 2.103806888997526e-08, "epoch": 79.87272727272727, "percentage": 79.75, "elapsed_time": "0:38:47", "remaining_time": "0:09:51"} | |
| {"current_steps": 320, "total_steps": 400, "loss": 0.704, "lr": 2.078173154799861e-08, "epoch": 80.0, "percentage": 80.0, "elapsed_time": "0:38:51", "remaining_time": "0:09:42"} | |
| {"current_steps": 320, "total_steps": 400, "eval_loss": 0.6397803425788879, "epoch": 80.0, "percentage": 80.0, "elapsed_time": "0:38:51", "remaining_time": "0:09:42"} | |
| {"current_steps": 321, "total_steps": 400, "loss": 0.6742, "lr": 2.0528000059645996e-08, "epoch": 80.2909090909091, "percentage": 80.25, "elapsed_time": "0:39:22", "remaining_time": "0:09:41"} | |
| {"current_steps": 322, "total_steps": 400, "loss": 0.6589, "lr": 2.027689374755261e-08, "epoch": 80.58181818181818, "percentage": 80.5, "elapsed_time": "0:39:29", "remaining_time": "0:09:33"} | |
| {"current_steps": 323, "total_steps": 400, "loss": 0.6384, "lr": 2.0028431734436306e-08, "epoch": 80.87272727272727, "percentage": 80.75, "elapsed_time": "0:39:37", "remaining_time": "0:09:26"} | |
| {"current_steps": 324, "total_steps": 400, "loss": 0.6523, "lr": 1.9782632941641373e-08, "epoch": 81.0, "percentage": 81.0, "elapsed_time": "0:39:40", "remaining_time": "0:09:18"} | |
| {"current_steps": 325, "total_steps": 400, "loss": 0.7186, "lr": 1.9539516087697516e-08, "epoch": 81.2909090909091, "percentage": 81.25, "elapsed_time": "0:39:47", "remaining_time": "0:09:10"} | |
| {"current_steps": 326, "total_steps": 400, "loss": 0.7155, "lr": 1.9299099686894422e-08, "epoch": 81.58181818181818, "percentage": 81.5, "elapsed_time": "0:39:54", "remaining_time": "0:09:03"} | |
| {"current_steps": 327, "total_steps": 400, "loss": 0.5796, "lr": 1.9061402047871834e-08, "epoch": 81.87272727272727, "percentage": 81.75, "elapsed_time": "0:40:01", "remaining_time": "0:08:56"} | |
| {"current_steps": 328, "total_steps": 400, "loss": 0.5744, "lr": 1.8826441272225223e-08, "epoch": 82.0, "percentage": 82.0, "elapsed_time": "0:40:04", "remaining_time": "0:08:47"} | |
| {"current_steps": 329, "total_steps": 400, "loss": 0.6681, "lr": 1.8594235253127372e-08, "epoch": 82.2909090909091, "percentage": 82.25, "elapsed_time": "0:40:11", "remaining_time": "0:08:40"} | |
| {"current_steps": 330, "total_steps": 400, "loss": 0.7103, "lr": 1.8364801673965642e-08, "epoch": 82.58181818181818, "percentage": 82.5, "elapsed_time": "0:40:17", "remaining_time": "0:08:32"} | |
| {"current_steps": 331, "total_steps": 400, "loss": 0.5704, "lr": 1.8138158006995365e-08, "epoch": 82.87272727272727, "percentage": 82.75, "elapsed_time": "0:40:25", "remaining_time": "0:08:25"} | |
| {"current_steps": 332, "total_steps": 400, "loss": 0.7128, "lr": 1.7914321512009295e-08, "epoch": 83.0, "percentage": 83.0, "elapsed_time": "0:40:28", "remaining_time": "0:08:17"} | |
| {"current_steps": 333, "total_steps": 400, "loss": 0.6072, "lr": 1.7693309235023126e-08, "epoch": 83.2909090909091, "percentage": 83.25, "elapsed_time": "0:40:35", "remaining_time": "0:08:09"} | |
| {"current_steps": 334, "total_steps": 400, "loss": 0.6525, "lr": 1.7475138006977434e-08, "epoch": 83.58181818181818, "percentage": 83.5, "elapsed_time": "0:40:42", "remaining_time": "0:08:02"} | |
| {"current_steps": 335, "total_steps": 400, "loss": 0.7323, "lr": 1.7259824442455922e-08, "epoch": 83.87272727272727, "percentage": 83.75, "elapsed_time": "0:40:48", "remaining_time": "0:07:55"} | |
| {"current_steps": 336, "total_steps": 400, "loss": 0.6316, "lr": 1.704738493842015e-08, "epoch": 84.0, "percentage": 84.0, "elapsed_time": "0:40:51", "remaining_time": "0:07:47"} | |
| {"current_steps": 336, "total_steps": 400, "eval_loss": 0.6387331485748291, "epoch": 84.0, "percentage": 84.0, "elapsed_time": "0:40:52", "remaining_time": "0:07:47"} | |
| {"current_steps": 337, "total_steps": 400, "loss": 0.6576, "lr": 1.6837835672960833e-08, "epoch": 84.2909090909091, "percentage": 84.25, "elapsed_time": "0:41:17", "remaining_time": "0:07:43"} | |
| {"current_steps": 338, "total_steps": 400, "loss": 0.6216, "lr": 1.663119260406585e-08, "epoch": 84.58181818181818, "percentage": 84.5, "elapsed_time": "0:41:24", "remaining_time": "0:07:35"} | |
| {"current_steps": 339, "total_steps": 400, "loss": 0.6975, "lr": 1.642747146840495e-08, "epoch": 84.87272727272727, "percentage": 84.75, "elapsed_time": "0:41:31", "remaining_time": "0:07:28"} | |
| {"current_steps": 340, "total_steps": 400, "loss": 0.6022, "lr": 1.6226687780131337e-08, "epoch": 85.0, "percentage": 85.0, "elapsed_time": "0:41:34", "remaining_time": "0:07:20"} | |
| {"current_steps": 341, "total_steps": 400, "loss": 0.6316, "lr": 1.602885682970026e-08, "epoch": 85.2909090909091, "percentage": 85.25, "elapsed_time": "0:41:41", "remaining_time": "0:07:12"} | |
| {"current_steps": 342, "total_steps": 400, "loss": 0.6725, "lr": 1.5833993682704515e-08, "epoch": 85.58181818181818, "percentage": 85.5, "elapsed_time": "0:41:47", "remaining_time": "0:07:05"} | |
| {"current_steps": 343, "total_steps": 400, "loss": 0.6319, "lr": 1.5642113178727193e-08, "epoch": 85.87272727272727, "percentage": 85.75, "elapsed_time": "0:41:54", "remaining_time": "0:06:57"} | |
| {"current_steps": 344, "total_steps": 400, "loss": 0.72, "lr": 1.5453229930211566e-08, "epoch": 86.0, "percentage": 86.0, "elapsed_time": "0:41:57", "remaining_time": "0:06:49"} | |
| {"current_steps": 345, "total_steps": 400, "loss": 0.7343, "lr": 1.5267358321348288e-08, "epoch": 86.2909090909091, "percentage": 86.25, "elapsed_time": "0:42:04", "remaining_time": "0:06:42"} | |
| {"current_steps": 346, "total_steps": 400, "loss": 0.6112, "lr": 1.5084512506980025e-08, "epoch": 86.58181818181818, "percentage": 86.5, "elapsed_time": "0:42:11", "remaining_time": "0:06:35"} | |
| {"current_steps": 347, "total_steps": 400, "loss": 0.6377, "lr": 1.490470641152345e-08, "epoch": 86.87272727272727, "percentage": 86.75, "elapsed_time": "0:42:17", "remaining_time": "0:06:27"} | |
| {"current_steps": 348, "total_steps": 400, "loss": 0.603, "lr": 1.4727953727908877e-08, "epoch": 87.0, "percentage": 87.0, "elapsed_time": "0:42:20", "remaining_time": "0:06:19"} | |
| {"current_steps": 349, "total_steps": 400, "loss": 0.6832, "lr": 1.4554267916537493e-08, "epoch": 87.2909090909091, "percentage": 87.25, "elapsed_time": "0:42:27", "remaining_time": "0:06:12"} | |
| {"current_steps": 350, "total_steps": 400, "loss": 0.6086, "lr": 1.438366220425628e-08, "epoch": 87.58181818181818, "percentage": 87.5, "elapsed_time": "0:42:34", "remaining_time": "0:06:04"} | |
| {"current_steps": 351, "total_steps": 400, "loss": 0.6735, "lr": 1.4216149583350753e-08, "epoch": 87.87272727272727, "percentage": 87.75, "elapsed_time": "0:42:40", "remaining_time": "0:05:57"} | |
| {"current_steps": 352, "total_steps": 400, "loss": 0.6232, "lr": 1.405174281055556e-08, "epoch": 88.0, "percentage": 88.0, "elapsed_time": "0:42:44", "remaining_time": "0:05:49"} | |
| {"current_steps": 352, "total_steps": 400, "eval_loss": 0.6380465030670166, "epoch": 88.0, "percentage": 88.0, "elapsed_time": "0:42:44", "remaining_time": "0:05:49"} | |
| {"current_steps": 353, "total_steps": 400, "loss": 0.6388, "lr": 1.3890454406082957e-08, "epoch": 88.2909090909091, "percentage": 88.25, "elapsed_time": "0:43:14", "remaining_time": "0:05:45"} | |
| {"current_steps": 354, "total_steps": 400, "loss": 0.6658, "lr": 1.3732296652669417e-08, "epoch": 88.58181818181818, "percentage": 88.5, "elapsed_time": "0:43:21", "remaining_time": "0:05:37"} | |
| {"current_steps": 355, "total_steps": 400, "loss": 0.6671, "lr": 1.3577281594640182e-08, "epoch": 88.87272727272727, "percentage": 88.75, "elapsed_time": "0:43:28", "remaining_time": "0:05:30"} | |
| {"current_steps": 356, "total_steps": 400, "loss": 0.6185, "lr": 1.3425421036992096e-08, "epoch": 89.0, "percentage": 89.0, "elapsed_time": "0:43:31", "remaining_time": "0:05:22"} | |
| {"current_steps": 357, "total_steps": 400, "loss": 0.6648, "lr": 1.327672654449457e-08, "epoch": 89.2909090909091, "percentage": 89.25, "elapsed_time": "0:43:37", "remaining_time": "0:05:15"} | |
| {"current_steps": 358, "total_steps": 400, "loss": 0.6731, "lr": 1.3131209440808898e-08, "epoch": 89.58181818181818, "percentage": 89.5, "elapsed_time": "0:43:45", "remaining_time": "0:05:08"} | |
| {"current_steps": 359, "total_steps": 400, "loss": 0.5938, "lr": 1.2988880807625927e-08, "epoch": 89.87272727272727, "percentage": 89.75, "elapsed_time": "0:43:52", "remaining_time": "0:05:00"} | |
| {"current_steps": 360, "total_steps": 400, "loss": 0.7107, "lr": 1.284975148382211e-08, "epoch": 90.0, "percentage": 90.0, "elapsed_time": "0:43:55", "remaining_time": "0:04:52"} | |
| {"current_steps": 361, "total_steps": 400, "loss": 0.6798, "lr": 1.2713832064634124e-08, "epoch": 90.2909090909091, "percentage": 90.25, "elapsed_time": "0:44:01", "remaining_time": "0:04:45"} | |
| {"current_steps": 362, "total_steps": 400, "loss": 0.6249, "lr": 1.2581132900851971e-08, "epoch": 90.58181818181818, "percentage": 90.5, "elapsed_time": "0:44:09", "remaining_time": "0:04:38"} | |
| {"current_steps": 363, "total_steps": 400, "loss": 0.6616, "lr": 1.2451664098030743e-08, "epoch": 90.87272727272727, "percentage": 90.75, "elapsed_time": "0:44:15", "remaining_time": "0:04:30"} | |
| {"current_steps": 364, "total_steps": 400, "loss": 0.6418, "lr": 1.232543551572103e-08, "epoch": 91.0, "percentage": 91.0, "elapsed_time": "0:44:18", "remaining_time": "0:04:22"} | |
| {"current_steps": 365, "total_steps": 400, "loss": 0.707, "lr": 1.2202456766718091e-08, "epoch": 91.2909090909091, "percentage": 91.25, "elapsed_time": "0:44:25", "remaining_time": "0:04:15"} | |
| {"current_steps": 366, "total_steps": 400, "loss": 0.6083, "lr": 1.2082737216329793e-08, "epoch": 91.58181818181818, "percentage": 91.5, "elapsed_time": "0:44:32", "remaining_time": "0:04:08"} | |
| {"current_steps": 367, "total_steps": 400, "loss": 0.6327, "lr": 1.1966285981663406e-08, "epoch": 91.87272727272727, "percentage": 91.75, "elapsed_time": "0:44:39", "remaining_time": "0:04:00"} | |
| {"current_steps": 368, "total_steps": 400, "loss": 0.6545, "lr": 1.1853111930931313e-08, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:42", "remaining_time": "0:03:53"} | |
| {"current_steps": 368, "total_steps": 400, "eval_loss": 0.6371535062789917, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:43", "remaining_time": "0:03:53"} | |
| {"current_steps": 369, "total_steps": 400, "loss": 0.5913, "lr": 1.174322368277565e-08, "epoch": 92.2909090909091, "percentage": 92.25, "elapsed_time": "0:45:15", "remaining_time": "0:03:48"} | |
| {"current_steps": 370, "total_steps": 400, "loss": 0.6869, "lr": 1.1636629605611967e-08, "epoch": 92.58181818181818, "percentage": 92.5, "elapsed_time": "0:45:22", "remaining_time": "0:03:40"} | |
| {"current_steps": 371, "total_steps": 400, "loss": 0.6699, "lr": 1.1533337816991931e-08, "epoch": 92.87272727272727, "percentage": 92.75, "elapsed_time": "0:45:29", "remaining_time": "0:03:33"} | |
| {"current_steps": 372, "total_steps": 400, "loss": 0.658, "lr": 1.1433356182985158e-08, "epoch": 93.0, "percentage": 93.0, "elapsed_time": "0:45:32", "remaining_time": "0:03:25"} | |
| {"current_steps": 373, "total_steps": 400, "loss": 0.7064, "lr": 1.133669231758016e-08, "epoch": 93.2909090909091, "percentage": 93.25, "elapsed_time": "0:45:40", "remaining_time": "0:03:18"} | |
| {"current_steps": 374, "total_steps": 400, "loss": 0.6268, "lr": 1.1243353582104555e-08, "epoch": 93.58181818181818, "percentage": 93.5, "elapsed_time": "0:45:46", "remaining_time": "0:03:10"} | |
| {"current_steps": 375, "total_steps": 400, "loss": 0.6366, "lr": 1.115334708466442e-08, "epoch": 93.87272727272727, "percentage": 93.75, "elapsed_time": "0:45:53", "remaining_time": "0:03:03"} | |
| {"current_steps": 376, "total_steps": 400, "loss": 0.5847, "lr": 1.1066679679602998e-08, "epoch": 94.0, "percentage": 94.0, "elapsed_time": "0:45:56", "remaining_time": "0:02:55"} | |
| {"current_steps": 377, "total_steps": 400, "loss": 0.6578, "lr": 1.0983357966978745e-08, "epoch": 94.2909090909091, "percentage": 94.25, "elapsed_time": "0:46:03", "remaining_time": "0:02:48"} | |
| {"current_steps": 378, "total_steps": 400, "loss": 0.6523, "lr": 1.0903388292062667e-08, "epoch": 94.58181818181818, "percentage": 94.5, "elapsed_time": "0:46:10", "remaining_time": "0:02:41"} | |
| {"current_steps": 379, "total_steps": 400, "loss": 0.6582, "lr": 1.0826776744855121e-08, "epoch": 94.87272727272727, "percentage": 94.75, "elapsed_time": "0:46:17", "remaining_time": "0:02:33"} | |
| {"current_steps": 380, "total_steps": 400, "loss": 0.6047, "lr": 1.0753529159622047e-08, "epoch": 95.0, "percentage": 95.0, "elapsed_time": "0:46:20", "remaining_time": "0:02:26"} | |
| {"current_steps": 381, "total_steps": 400, "loss": 0.6078, "lr": 1.068365111445064e-08, "epoch": 95.2909090909091, "percentage": 95.25, "elapsed_time": "0:46:26", "remaining_time": "0:02:18"} | |
| {"current_steps": 382, "total_steps": 400, "loss": 0.6347, "lr": 1.0617147930824585e-08, "epoch": 95.58181818181818, "percentage": 95.5, "elapsed_time": "0:46:34", "remaining_time": "0:02:11"} | |
| {"current_steps": 383, "total_steps": 400, "loss": 0.6709, "lr": 1.0554024673218806e-08, "epoch": 95.87272727272727, "percentage": 95.75, "elapsed_time": "0:46:40", "remaining_time": "0:02:04"} | |
| {"current_steps": 384, "total_steps": 400, "loss": 0.7126, "lr": 1.0494286148713743e-08, "epoch": 96.0, "percentage": 96.0, "elapsed_time": "0:46:43", "remaining_time": "0:01:56"} | |
| {"current_steps": 384, "total_steps": 400, "eval_loss": 0.6363654732704163, "epoch": 96.0, "percentage": 96.0, "elapsed_time": "0:46:44", "remaining_time": "0:01:56"} | |
| {"current_steps": 385, "total_steps": 400, "loss": 0.5571, "lr": 1.0437936906629333e-08, "epoch": 96.2909090909091, "percentage": 96.25, "elapsed_time": "0:47:15", "remaining_time": "0:01:50"} | |
| {"current_steps": 386, "total_steps": 400, "loss": 0.7043, "lr": 1.0384981238178533e-08, "epoch": 96.58181818181818, "percentage": 96.5, "elapsed_time": "0:47:23", "remaining_time": "0:01:43"} | |
| {"current_steps": 387, "total_steps": 400, "loss": 0.6956, "lr": 1.033542317614051e-08, "epoch": 96.87272727272727, "percentage": 96.75, "elapsed_time": "0:47:30", "remaining_time": "0:01:35"} | |
| {"current_steps": 388, "total_steps": 400, "loss": 0.5839, "lr": 1.0289266494553564e-08, "epoch": 97.0, "percentage": 97.0, "elapsed_time": "0:47:33", "remaining_time": "0:01:28"} | |
| {"current_steps": 389, "total_steps": 400, "loss": 0.629, "lr": 1.0246514708427701e-08, "epoch": 97.2909090909091, "percentage": 97.25, "elapsed_time": "0:47:40", "remaining_time": "0:01:20"} | |
| {"current_steps": 390, "total_steps": 400, "loss": 0.7125, "lr": 1.0207171073476952e-08, "epoch": 97.58181818181818, "percentage": 97.5, "elapsed_time": "0:47:46", "remaining_time": "0:01:13"} | |
| {"current_steps": 391, "total_steps": 400, "loss": 0.7004, "lr": 1.017123858587145e-08, "epoch": 97.87272727272727, "percentage": 97.75, "elapsed_time": "0:47:53", "remaining_time": "0:01:06"} | |
| {"current_steps": 392, "total_steps": 400, "loss": 0.4986, "lr": 1.0138719982009241e-08, "epoch": 98.0, "percentage": 98.0, "elapsed_time": "0:47:57", "remaining_time": "0:00:58"} | |
| {"current_steps": 393, "total_steps": 400, "loss": 0.7095, "lr": 1.0109617738307912e-08, "epoch": 98.2909090909091, "percentage": 98.25, "elapsed_time": "0:48:04", "remaining_time": "0:00:51"} | |
| {"current_steps": 394, "total_steps": 400, "loss": 0.5806, "lr": 1.0083934071015988e-08, "epoch": 98.58181818181818, "percentage": 98.5, "elapsed_time": "0:48:11", "remaining_time": "0:00:44"} | |
| {"current_steps": 395, "total_steps": 400, "loss": 0.6434, "lr": 1.0061670936044179e-08, "epoch": 98.87272727272727, "percentage": 98.75, "elapsed_time": "0:48:17", "remaining_time": "0:00:36"} | |
| {"current_steps": 396, "total_steps": 400, "loss": 0.7094, "lr": 1.0042830028816398e-08, "epoch": 99.0, "percentage": 99.0, "elapsed_time": "0:48:20", "remaining_time": "0:00:29"} | |
| {"current_steps": 397, "total_steps": 400, "loss": 0.5678, "lr": 1.002741278414069e-08, "epoch": 99.2909090909091, "percentage": 99.25, "elapsed_time": "0:48:27", "remaining_time": "0:00:21"} | |
| {"current_steps": 398, "total_steps": 400, "loss": 0.6347, "lr": 1.0015420376099922e-08, "epoch": 99.58181818181818, "percentage": 99.5, "elapsed_time": "0:48:34", "remaining_time": "0:00:14"} | |
| {"current_steps": 399, "total_steps": 400, "loss": 0.7428, "lr": 1.0006853717962394e-08, "epoch": 99.87272727272727, "percentage": 99.75, "elapsed_time": "0:48:41", "remaining_time": "0:00:07"} | |
| {"current_steps": 400, "total_steps": 400, "loss": 0.6465, "lr": 1.0001713462112291e-08, "epoch": 100.0, "percentage": 100.0, "elapsed_time": "0:48:44", "remaining_time": "0:00:00"} | |
| {"current_steps": 400, "total_steps": 400, "eval_loss": 0.6363555192947388, "epoch": 100.0, "percentage": 100.0, "elapsed_time": "0:48:45", "remaining_time": "0:00:00"} | |
| {"current_steps": 400, "total_steps": 400, "epoch": 100.0, "percentage": 100.0, "elapsed_time": "0:49:08", "remaining_time": "0:00:00"} | |