Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1d8edb387e72a8877019b79774ec7d0df1d46591c37431d7a0e042d2f75214b3
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c8d7d530b5e6fb1c1455b1e2a7bbcc52e10625a127537f9dca5b6b5676e85b85
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e4ee739813af5d106633f4aa1ad6c52bec03e2c3800b070614b402b7be613c77
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:411be6f68a57c444ca4a09c56237d9607f385157ba3ade7ae7444a3603febbfd
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -199,3 +199,104 @@
|
|
| 199 |
{"current_steps": 1980, "total_steps": 3984, "loss": 0.6877, "lr": 5e-06, "epoch": 1.9872036130974784, "percentage": 49.7, "elapsed_time": "17:55:01", "remaining_time": "18:08:03"}
|
| 200 |
{"current_steps": 1990, "total_steps": 3984, "loss": 0.6913, "lr": 5e-06, "epoch": 1.997239994981809, "percentage": 49.95, "elapsed_time": "18:00:22", "remaining_time": "18:02:32"}
|
| 201 |
{"current_steps": 1992, "total_steps": 3984, "eval_loss": 0.7165391445159912, "epoch": 1.999247271358675, "percentage": 50.0, "elapsed_time": "18:13:19", "remaining_time": "18:13:19"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 199 |
{"current_steps": 1980, "total_steps": 3984, "loss": 0.6877, "lr": 5e-06, "epoch": 1.9872036130974784, "percentage": 49.7, "elapsed_time": "17:55:01", "remaining_time": "18:08:03"}
|
| 200 |
{"current_steps": 1990, "total_steps": 3984, "loss": 0.6913, "lr": 5e-06, "epoch": 1.997239994981809, "percentage": 49.95, "elapsed_time": "18:00:22", "remaining_time": "18:02:32"}
|
| 201 |
{"current_steps": 1992, "total_steps": 3984, "eval_loss": 0.7165391445159912, "epoch": 1.999247271358675, "percentage": 50.0, "elapsed_time": "18:13:19", "remaining_time": "18:13:19"}
|
| 202 |
+
{"current_steps": 2000, "total_steps": 3984, "loss": 0.7009, "lr": 5e-06, "epoch": 2.0072763768661397, "percentage": 50.2, "elapsed_time": "18:18:33", "remaining_time": "18:09:45"}
|
| 203 |
+
{"current_steps": 2010, "total_steps": 3984, "loss": 0.6453, "lr": 5e-06, "epoch": 2.0173127587504704, "percentage": 50.45, "elapsed_time": "18:23:55", "remaining_time": "18:04:08"}
|
| 204 |
+
{"current_steps": 2020, "total_steps": 3984, "loss": 0.6456, "lr": 5e-06, "epoch": 2.027349140634801, "percentage": 50.7, "elapsed_time": "18:29:18", "remaining_time": "17:58:32"}
|
| 205 |
+
{"current_steps": 2030, "total_steps": 3984, "loss": 0.6454, "lr": 5e-06, "epoch": 2.037385522519132, "percentage": 50.95, "elapsed_time": "18:34:38", "remaining_time": "17:52:54"}
|
| 206 |
+
{"current_steps": 2040, "total_steps": 3984, "loss": 0.6437, "lr": 5e-06, "epoch": 2.0474219044034627, "percentage": 51.2, "elapsed_time": "18:39:57", "remaining_time": "17:47:15"}
|
| 207 |
+
{"current_steps": 2050, "total_steps": 3984, "loss": 0.6473, "lr": 5e-06, "epoch": 2.057458286287793, "percentage": 51.46, "elapsed_time": "18:45:17", "remaining_time": "17:41:37"}
|
| 208 |
+
{"current_steps": 2060, "total_steps": 3984, "loss": 0.6466, "lr": 5e-06, "epoch": 2.067494668172124, "percentage": 51.71, "elapsed_time": "18:50:37", "remaining_time": "17:35:59"}
|
| 209 |
+
{"current_steps": 2070, "total_steps": 3984, "loss": 0.6448, "lr": 5e-06, "epoch": 2.0775310500564546, "percentage": 51.96, "elapsed_time": "18:55:57", "remaining_time": "17:30:21"}
|
| 210 |
+
{"current_steps": 2080, "total_steps": 3984, "loss": 0.648, "lr": 5e-06, "epoch": 2.0875674319407853, "percentage": 52.21, "elapsed_time": "19:01:20", "remaining_time": "17:24:45"}
|
| 211 |
+
{"current_steps": 2090, "total_steps": 3984, "loss": 0.6525, "lr": 5e-06, "epoch": 2.097603813825116, "percentage": 52.46, "elapsed_time": "19:06:43", "remaining_time": "17:19:11"}
|
| 212 |
+
{"current_steps": 2100, "total_steps": 3984, "loss": 0.6456, "lr": 5e-06, "epoch": 2.107640195709447, "percentage": 52.71, "elapsed_time": "19:12:07", "remaining_time": "17:13:37"}
|
| 213 |
+
{"current_steps": 2110, "total_steps": 3984, "loss": 0.6456, "lr": 5e-06, "epoch": 2.1176765775937776, "percentage": 52.96, "elapsed_time": "19:17:31", "remaining_time": "17:08:03"}
|
| 214 |
+
{"current_steps": 2120, "total_steps": 3984, "loss": 0.6438, "lr": 5e-06, "epoch": 2.1277129594781083, "percentage": 53.21, "elapsed_time": "19:22:52", "remaining_time": "17:02:27"}
|
| 215 |
+
{"current_steps": 2130, "total_steps": 3984, "loss": 0.6482, "lr": 5e-06, "epoch": 2.1377493413624387, "percentage": 53.46, "elapsed_time": "19:28:12", "remaining_time": "16:56:50"}
|
| 216 |
+
{"current_steps": 2140, "total_steps": 3984, "loss": 0.6482, "lr": 5e-06, "epoch": 2.1477857232467694, "percentage": 53.71, "elapsed_time": "19:33:32", "remaining_time": "16:51:13"}
|
| 217 |
+
{"current_steps": 2150, "total_steps": 3984, "loss": 0.649, "lr": 5e-06, "epoch": 2.1578221051311, "percentage": 53.97, "elapsed_time": "19:38:54", "remaining_time": "16:45:37"}
|
| 218 |
+
{"current_steps": 2160, "total_steps": 3984, "loss": 0.6457, "lr": 5e-06, "epoch": 2.167858487015431, "percentage": 54.22, "elapsed_time": "19:44:16", "remaining_time": "16:40:03"}
|
| 219 |
+
{"current_steps": 2170, "total_steps": 3984, "loss": 0.6433, "lr": 5e-06, "epoch": 2.1778948688997617, "percentage": 54.47, "elapsed_time": "19:49:38", "remaining_time": "16:34:28"}
|
| 220 |
+
{"current_steps": 2180, "total_steps": 3984, "loss": 0.6493, "lr": 5e-06, "epoch": 2.1879312507840925, "percentage": 54.72, "elapsed_time": "19:55:02", "remaining_time": "16:28:55"}
|
| 221 |
+
{"current_steps": 2190, "total_steps": 3984, "loss": 0.6515, "lr": 5e-06, "epoch": 2.197967632668423, "percentage": 54.97, "elapsed_time": "20:00:26", "remaining_time": "16:23:22"}
|
| 222 |
+
{"current_steps": 2200, "total_steps": 3984, "loss": 0.648, "lr": 5e-06, "epoch": 2.2080040145527535, "percentage": 55.22, "elapsed_time": "20:05:49", "remaining_time": "16:17:49"}
|
| 223 |
+
{"current_steps": 2210, "total_steps": 3984, "loss": 0.6526, "lr": 5e-06, "epoch": 2.2180403964370843, "percentage": 55.47, "elapsed_time": "20:11:11", "remaining_time": "16:12:14"}
|
| 224 |
+
{"current_steps": 2220, "total_steps": 3984, "loss": 0.6479, "lr": 5e-06, "epoch": 2.228076778321415, "percentage": 55.72, "elapsed_time": "20:16:31", "remaining_time": "16:06:38"}
|
| 225 |
+
{"current_steps": 2230, "total_steps": 3984, "loss": 0.6485, "lr": 5e-06, "epoch": 2.238113160205746, "percentage": 55.97, "elapsed_time": "20:21:52", "remaining_time": "16:01:03"}
|
| 226 |
+
{"current_steps": 2240, "total_steps": 3984, "loss": 0.6467, "lr": 5e-06, "epoch": 2.2481495420900766, "percentage": 56.22, "elapsed_time": "20:27:15", "remaining_time": "15:55:30"}
|
| 227 |
+
{"current_steps": 2250, "total_steps": 3984, "loss": 0.6468, "lr": 5e-06, "epoch": 2.2581859239744073, "percentage": 56.48, "elapsed_time": "20:32:38", "remaining_time": "15:49:57"}
|
| 228 |
+
{"current_steps": 2260, "total_steps": 3984, "loss": 0.6484, "lr": 5e-06, "epoch": 2.268222305858738, "percentage": 56.73, "elapsed_time": "20:38:01", "remaining_time": "15:44:24"}
|
| 229 |
+
{"current_steps": 2270, "total_steps": 3984, "loss": 0.6483, "lr": 5e-06, "epoch": 2.278258687743069, "percentage": 56.98, "elapsed_time": "20:43:23", "remaining_time": "15:38:50"}
|
| 230 |
+
{"current_steps": 2280, "total_steps": 3984, "loss": 0.6477, "lr": 5e-06, "epoch": 2.288295069627399, "percentage": 57.23, "elapsed_time": "20:48:46", "remaining_time": "15:33:17"}
|
| 231 |
+
{"current_steps": 2290, "total_steps": 3984, "loss": 0.6451, "lr": 5e-06, "epoch": 2.29833145151173, "percentage": 57.48, "elapsed_time": "20:54:10", "remaining_time": "15:27:45"}
|
| 232 |
+
{"current_steps": 2300, "total_steps": 3984, "loss": 0.6502, "lr": 5e-06, "epoch": 2.3083678333960607, "percentage": 57.73, "elapsed_time": "20:59:33", "remaining_time": "15:22:12"}
|
| 233 |
+
{"current_steps": 2310, "total_steps": 3984, "loss": 0.652, "lr": 5e-06, "epoch": 2.3184042152803914, "percentage": 57.98, "elapsed_time": "21:04:55", "remaining_time": "15:16:39"}
|
| 234 |
+
{"current_steps": 2320, "total_steps": 3984, "loss": 0.6498, "lr": 5e-06, "epoch": 2.328440597164722, "percentage": 58.23, "elapsed_time": "21:10:18", "remaining_time": "15:11:07"}
|
| 235 |
+
{"current_steps": 2330, "total_steps": 3984, "loss": 0.6486, "lr": 5e-06, "epoch": 2.338476979049053, "percentage": 58.48, "elapsed_time": "21:15:38", "remaining_time": "15:05:32"}
|
| 236 |
+
{"current_steps": 2340, "total_steps": 3984, "loss": 0.6466, "lr": 5e-06, "epoch": 2.3485133609333837, "percentage": 58.73, "elapsed_time": "21:20:59", "remaining_time": "14:59:58"}
|
| 237 |
+
{"current_steps": 2350, "total_steps": 3984, "loss": 0.6463, "lr": 5e-06, "epoch": 2.358549742817714, "percentage": 58.99, "elapsed_time": "21:26:21", "remaining_time": "14:54:25"}
|
| 238 |
+
{"current_steps": 2360, "total_steps": 3984, "loss": 0.6502, "lr": 5e-06, "epoch": 2.3685861247020448, "percentage": 59.24, "elapsed_time": "21:31:40", "remaining_time": "14:48:50"}
|
| 239 |
+
{"current_steps": 2370, "total_steps": 3984, "loss": 0.6537, "lr": 5e-06, "epoch": 2.3786225065863755, "percentage": 59.49, "elapsed_time": "21:36:59", "remaining_time": "14:43:16"}
|
| 240 |
+
{"current_steps": 2380, "total_steps": 3984, "loss": 0.6505, "lr": 5e-06, "epoch": 2.3886588884707063, "percentage": 59.74, "elapsed_time": "21:42:22", "remaining_time": "14:37:43"}
|
| 241 |
+
{"current_steps": 2390, "total_steps": 3984, "loss": 0.6467, "lr": 5e-06, "epoch": 2.398695270355037, "percentage": 59.99, "elapsed_time": "21:47:44", "remaining_time": "14:32:11"}
|
| 242 |
+
{"current_steps": 2400, "total_steps": 3984, "loss": 0.6486, "lr": 5e-06, "epoch": 2.408731652239368, "percentage": 60.24, "elapsed_time": "21:53:06", "remaining_time": "14:26:38"}
|
| 243 |
+
{"current_steps": 2410, "total_steps": 3984, "loss": 0.6511, "lr": 5e-06, "epoch": 2.4187680341236986, "percentage": 60.49, "elapsed_time": "21:58:28", "remaining_time": "14:21:06"}
|
| 244 |
+
{"current_steps": 2420, "total_steps": 3984, "loss": 0.6518, "lr": 5e-06, "epoch": 2.4288044160080293, "percentage": 60.74, "elapsed_time": "22:03:49", "remaining_time": "14:15:34"}
|
| 245 |
+
{"current_steps": 2430, "total_steps": 3984, "loss": 0.6471, "lr": 5e-06, "epoch": 2.4388407978923596, "percentage": 60.99, "elapsed_time": "22:09:09", "remaining_time": "14:10:00"}
|
| 246 |
+
{"current_steps": 2440, "total_steps": 3984, "loss": 0.6549, "lr": 5e-06, "epoch": 2.4488771797766904, "percentage": 61.24, "elapsed_time": "22:14:29", "remaining_time": "14:04:26"}
|
| 247 |
+
{"current_steps": 2450, "total_steps": 3984, "loss": 0.6489, "lr": 5e-06, "epoch": 2.458913561661021, "percentage": 61.5, "elapsed_time": "22:19:49", "remaining_time": "13:58:53"}
|
| 248 |
+
{"current_steps": 2460, "total_steps": 3984, "loss": 0.6514, "lr": 5e-06, "epoch": 2.468949943545352, "percentage": 61.75, "elapsed_time": "22:25:10", "remaining_time": "13:53:21"}
|
| 249 |
+
{"current_steps": 2470, "total_steps": 3984, "loss": 0.6567, "lr": 5e-06, "epoch": 2.4789863254296827, "percentage": 62.0, "elapsed_time": "22:30:29", "remaining_time": "13:47:47"}
|
| 250 |
+
{"current_steps": 2480, "total_steps": 3984, "loss": 0.6461, "lr": 5e-06, "epoch": 2.4890227073140134, "percentage": 62.25, "elapsed_time": "22:35:48", "remaining_time": "13:42:13"}
|
| 251 |
+
{"current_steps": 2490, "total_steps": 3984, "loss": 0.65, "lr": 5e-06, "epoch": 2.499059089198344, "percentage": 62.5, "elapsed_time": "22:41:08", "remaining_time": "13:36:41"}
|
| 252 |
+
{"current_steps": 2500, "total_steps": 3984, "loss": 0.6566, "lr": 5e-06, "epoch": 2.5090954710826745, "percentage": 62.75, "elapsed_time": "22:46:29", "remaining_time": "13:31:09"}
|
| 253 |
+
{"current_steps": 2510, "total_steps": 3984, "loss": 0.6525, "lr": 5e-06, "epoch": 2.5191318529670053, "percentage": 63.0, "elapsed_time": "22:51:49", "remaining_time": "13:25:36"}
|
| 254 |
+
{"current_steps": 2520, "total_steps": 3984, "loss": 0.6477, "lr": 5e-06, "epoch": 2.529168234851336, "percentage": 63.25, "elapsed_time": "22:57:11", "remaining_time": "13:20:04"}
|
| 255 |
+
{"current_steps": 2530, "total_steps": 3984, "loss": 0.6484, "lr": 5e-06, "epoch": 2.5392046167356668, "percentage": 63.5, "elapsed_time": "23:02:31", "remaining_time": "13:14:32"}
|
| 256 |
+
{"current_steps": 2540, "total_steps": 3984, "loss": 0.6498, "lr": 5e-06, "epoch": 2.5492409986199975, "percentage": 63.76, "elapsed_time": "23:07:51", "remaining_time": "13:09:00"}
|
| 257 |
+
{"current_steps": 2550, "total_steps": 3984, "loss": 0.6529, "lr": 5e-06, "epoch": 2.5592773805043283, "percentage": 64.01, "elapsed_time": "23:13:10", "remaining_time": "13:03:27"}
|
| 258 |
+
{"current_steps": 2560, "total_steps": 3984, "loss": 0.6496, "lr": 5e-06, "epoch": 2.569313762388659, "percentage": 64.26, "elapsed_time": "23:18:30", "remaining_time": "12:57:55"}
|
| 259 |
+
{"current_steps": 2570, "total_steps": 3984, "loss": 0.6488, "lr": 5e-06, "epoch": 2.57935014427299, "percentage": 64.51, "elapsed_time": "23:23:50", "remaining_time": "12:52:23"}
|
| 260 |
+
{"current_steps": 2580, "total_steps": 3984, "loss": 0.6605, "lr": 5e-06, "epoch": 2.58938652615732, "percentage": 64.76, "elapsed_time": "23:29:10", "remaining_time": "12:46:51"}
|
| 261 |
+
{"current_steps": 2590, "total_steps": 3984, "loss": 0.6474, "lr": 5e-06, "epoch": 2.599422908041651, "percentage": 65.01, "elapsed_time": "23:34:31", "remaining_time": "12:41:19"}
|
| 262 |
+
{"current_steps": 2600, "total_steps": 3984, "loss": 0.6532, "lr": 5e-06, "epoch": 2.6094592899259816, "percentage": 65.26, "elapsed_time": "23:39:51", "remaining_time": "12:35:47"}
|
| 263 |
+
{"current_steps": 2610, "total_steps": 3984, "loss": 0.6527, "lr": 5e-06, "epoch": 2.6194956718103124, "percentage": 65.51, "elapsed_time": "23:45:10", "remaining_time": "12:30:15"}
|
| 264 |
+
{"current_steps": 2620, "total_steps": 3984, "loss": 0.6465, "lr": 5e-06, "epoch": 2.629532053694643, "percentage": 65.76, "elapsed_time": "23:50:29", "remaining_time": "12:24:43"}
|
| 265 |
+
{"current_steps": 2630, "total_steps": 3984, "loss": 0.6489, "lr": 5e-06, "epoch": 2.639568435578974, "percentage": 66.01, "elapsed_time": "23:55:48", "remaining_time": "12:19:11"}
|
| 266 |
+
{"current_steps": 2640, "total_steps": 3984, "loss": 0.6523, "lr": 5e-06, "epoch": 2.6496048174633042, "percentage": 66.27, "elapsed_time": "1 day, 0:01:09", "remaining_time": "12:13:40"}
|
| 267 |
+
{"current_steps": 2650, "total_steps": 3984, "loss": 0.6528, "lr": 5e-06, "epoch": 2.659641199347635, "percentage": 66.52, "elapsed_time": "1 day, 0:06:30", "remaining_time": "12:08:10"}
|
| 268 |
+
{"current_steps": 2660, "total_steps": 3984, "loss": 0.6474, "lr": 5e-06, "epoch": 2.6696775812319657, "percentage": 66.77, "elapsed_time": "1 day, 0:11:49", "remaining_time": "12:02:38"}
|
| 269 |
+
{"current_steps": 2670, "total_steps": 3984, "loss": 0.6512, "lr": 5e-06, "epoch": 2.6797139631162965, "percentage": 67.02, "elapsed_time": "1 day, 0:17:09", "remaining_time": "11:57:07"}
|
| 270 |
+
{"current_steps": 2680, "total_steps": 3984, "loss": 0.6503, "lr": 5e-06, "epoch": 2.6897503450006273, "percentage": 67.27, "elapsed_time": "1 day, 0:22:30", "remaining_time": "11:51:36"}
|
| 271 |
+
{"current_steps": 2690, "total_steps": 3984, "loss": 0.6496, "lr": 5e-06, "epoch": 2.699786726884958, "percentage": 67.52, "elapsed_time": "1 day, 0:27:51", "remaining_time": "11:46:05"}
|
| 272 |
+
{"current_steps": 2700, "total_steps": 3984, "loss": 0.6521, "lr": 5e-06, "epoch": 2.709823108769289, "percentage": 67.77, "elapsed_time": "1 day, 0:33:12", "remaining_time": "11:40:35"}
|
| 273 |
+
{"current_steps": 2710, "total_steps": 3984, "loss": 0.6509, "lr": 5e-06, "epoch": 2.7198594906536195, "percentage": 68.02, "elapsed_time": "1 day, 0:38:33", "remaining_time": "11:35:05"}
|
| 274 |
+
{"current_steps": 2720, "total_steps": 3984, "loss": 0.6519, "lr": 5e-06, "epoch": 2.7298958725379503, "percentage": 68.27, "elapsed_time": "1 day, 0:43:53", "remaining_time": "11:29:34"}
|
| 275 |
+
{"current_steps": 2730, "total_steps": 3984, "loss": 0.6541, "lr": 5e-06, "epoch": 2.7399322544222806, "percentage": 68.52, "elapsed_time": "1 day, 0:49:13", "remaining_time": "11:24:03"}
|
| 276 |
+
{"current_steps": 2740, "total_steps": 3984, "loss": 0.6548, "lr": 5e-06, "epoch": 2.7499686363066114, "percentage": 68.78, "elapsed_time": "1 day, 0:54:33", "remaining_time": "11:18:33"}
|
| 277 |
+
{"current_steps": 2750, "total_steps": 3984, "loss": 0.6525, "lr": 5e-06, "epoch": 2.760005018190942, "percentage": 69.03, "elapsed_time": "1 day, 0:59:54", "remaining_time": "11:13:02"}
|
| 278 |
+
{"current_steps": 2760, "total_steps": 3984, "loss": 0.6596, "lr": 5e-06, "epoch": 2.770041400075273, "percentage": 69.28, "elapsed_time": "1 day, 1:05:15", "remaining_time": "11:07:33"}
|
| 279 |
+
{"current_steps": 2770, "total_steps": 3984, "loss": 0.6521, "lr": 5e-06, "epoch": 2.7800777819596036, "percentage": 69.53, "elapsed_time": "1 day, 1:10:38", "remaining_time": "11:02:03"}
|
| 280 |
+
{"current_steps": 2780, "total_steps": 3984, "loss": 0.6506, "lr": 5e-06, "epoch": 2.7901141638439344, "percentage": 69.78, "elapsed_time": "1 day, 1:15:59", "remaining_time": "10:56:34"}
|
| 281 |
+
{"current_steps": 2790, "total_steps": 3984, "loss": 0.6542, "lr": 5e-06, "epoch": 2.8001505457282647, "percentage": 70.03, "elapsed_time": "1 day, 1:21:21", "remaining_time": "10:51:04"}
|
| 282 |
+
{"current_steps": 2800, "total_steps": 3984, "loss": 0.6545, "lr": 5e-06, "epoch": 2.8101869276125955, "percentage": 70.28, "elapsed_time": "1 day, 1:26:40", "remaining_time": "10:45:34"}
|
| 283 |
+
{"current_steps": 2810, "total_steps": 3984, "loss": 0.6539, "lr": 5e-06, "epoch": 2.8202233094969262, "percentage": 70.53, "elapsed_time": "1 day, 1:32:00", "remaining_time": "10:40:03"}
|
| 284 |
+
{"current_steps": 2820, "total_steps": 3984, "loss": 0.6497, "lr": 5e-06, "epoch": 2.830259691381257, "percentage": 70.78, "elapsed_time": "1 day, 1:37:20", "remaining_time": "10:34:33"}
|
| 285 |
+
{"current_steps": 2830, "total_steps": 3984, "loss": 0.6513, "lr": 5e-06, "epoch": 2.8402960732655878, "percentage": 71.03, "elapsed_time": "1 day, 1:42:39", "remaining_time": "10:29:03"}
|
| 286 |
+
{"current_steps": 2840, "total_steps": 3984, "loss": 0.6507, "lr": 5e-06, "epoch": 2.8503324551499185, "percentage": 71.29, "elapsed_time": "1 day, 1:48:01", "remaining_time": "10:23:34"}
|
| 287 |
+
{"current_steps": 2850, "total_steps": 3984, "loss": 0.6581, "lr": 5e-06, "epoch": 2.8603688370342493, "percentage": 71.54, "elapsed_time": "1 day, 1:53:23", "remaining_time": "10:18:05"}
|
| 288 |
+
{"current_steps": 2860, "total_steps": 3984, "loss": 0.6516, "lr": 5e-06, "epoch": 2.87040521891858, "percentage": 71.79, "elapsed_time": "1 day, 1:58:43", "remaining_time": "10:12:35"}
|
| 289 |
+
{"current_steps": 2870, "total_steps": 3984, "loss": 0.6511, "lr": 5e-06, "epoch": 2.880441600802911, "percentage": 72.04, "elapsed_time": "1 day, 2:04:05", "remaining_time": "10:07:06"}
|
| 290 |
+
{"current_steps": 2880, "total_steps": 3984, "loss": 0.6539, "lr": 5e-06, "epoch": 2.890477982687241, "percentage": 72.29, "elapsed_time": "1 day, 2:09:27", "remaining_time": "10:01:37"}
|
| 291 |
+
{"current_steps": 2890, "total_steps": 3984, "loss": 0.6512, "lr": 5e-06, "epoch": 2.900514364571572, "percentage": 72.54, "elapsed_time": "1 day, 2:14:47", "remaining_time": "9:56:07"}
|
| 292 |
+
{"current_steps": 2900, "total_steps": 3984, "loss": 0.6538, "lr": 5e-06, "epoch": 2.9105507464559026, "percentage": 72.79, "elapsed_time": "1 day, 2:20:08", "remaining_time": "9:50:38"}
|
| 293 |
+
{"current_steps": 2910, "total_steps": 3984, "loss": 0.6504, "lr": 5e-06, "epoch": 2.9205871283402334, "percentage": 73.04, "elapsed_time": "1 day, 2:25:30", "remaining_time": "9:45:09"}
|
| 294 |
+
{"current_steps": 2920, "total_steps": 3984, "loss": 0.6494, "lr": 5e-06, "epoch": 2.930623510224564, "percentage": 73.29, "elapsed_time": "1 day, 2:30:49", "remaining_time": "9:39:40"}
|
| 295 |
+
{"current_steps": 2930, "total_steps": 3984, "loss": 0.6512, "lr": 5e-06, "epoch": 2.940659892108895, "percentage": 73.54, "elapsed_time": "1 day, 2:36:08", "remaining_time": "9:34:10"}
|
| 296 |
+
{"current_steps": 2940, "total_steps": 3984, "loss": 0.655, "lr": 5e-06, "epoch": 2.950696273993225, "percentage": 73.8, "elapsed_time": "1 day, 2:41:27", "remaining_time": "9:28:40"}
|
| 297 |
+
{"current_steps": 2950, "total_steps": 3984, "loss": 0.6531, "lr": 5e-06, "epoch": 2.960732655877556, "percentage": 74.05, "elapsed_time": "1 day, 2:46:48", "remaining_time": "9:23:12"}
|
| 298 |
+
{"current_steps": 2960, "total_steps": 3984, "loss": 0.6551, "lr": 5e-06, "epoch": 2.9707690377618867, "percentage": 74.3, "elapsed_time": "1 day, 2:52:10", "remaining_time": "9:17:43"}
|
| 299 |
+
{"current_steps": 2970, "total_steps": 3984, "loss": 0.6553, "lr": 5e-06, "epoch": 2.9808054196462175, "percentage": 74.55, "elapsed_time": "1 day, 2:57:28", "remaining_time": "9:12:13"}
|
| 300 |
+
{"current_steps": 2980, "total_steps": 3984, "loss": 0.6511, "lr": 5e-06, "epoch": 2.9908418015305482, "percentage": 74.8, "elapsed_time": "1 day, 3:02:47", "remaining_time": "9:06:44"}
|
| 301 |
+
{"current_steps": 2989, "total_steps": 3984, "eval_loss": 0.7148573994636536, "epoch": 2.999874545226446, "percentage": 75.03, "elapsed_time": "1 day, 3:18:43", "remaining_time": "9:05:30"}
|
| 302 |
+
{"current_steps": 2990, "total_steps": 3984, "loss": 0.6887, "lr": 5e-06, "epoch": 3.000878183414879, "percentage": 75.05, "elapsed_time": "1 day, 3:20:29", "remaining_time": "9:05:21"}
|