Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0f5a141bdcbd87eaec7f19ed08de21401b5d84fc8adbf141811fe3cc6d84512
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:837cb881a4501b2164a8cdd444ab6552aafce76bce2c4e65c19201cc88a05782
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8dd107eeb00bc0d474f8d73ec8ac2067e75050dc6bae92f321ce255e47afcfbf
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:86edd7e08e1690c559e435b6ee165e96b2359b95d74e89b095dd6a4235979492
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -246,3 +246,114 @@
|
|
| 246 |
{"current_steps": 221, "total_steps": 550, "loss": 0.3732, "lr": 5.977974420901908e-05, "epoch": 2.004524886877828, "percentage": 40.18, "elapsed_time": "3:04:02", "remaining_time": "4:33:58"}
|
| 247 |
{"current_steps": 222, "total_steps": 550, "loss": 0.3539, "lr": 5.955869169282556e-05, "epoch": 2.013574660633484, "percentage": 40.36, "elapsed_time": "3:04:50", "remaining_time": "4:33:06"}
|
| 248 |
{"current_steps": 223, "total_steps": 550, "loss": 0.3625, "lr": 5.9336851355382557e-05, "epoch": 2.02262443438914, "percentage": 40.55, "elapsed_time": "3:05:39", "remaining_time": "4:32:15"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 246 |
{"current_steps": 221, "total_steps": 550, "loss": 0.3732, "lr": 5.977974420901908e-05, "epoch": 2.004524886877828, "percentage": 40.18, "elapsed_time": "3:04:02", "remaining_time": "4:33:58"}
|
| 247 |
{"current_steps": 222, "total_steps": 550, "loss": 0.3539, "lr": 5.955869169282556e-05, "epoch": 2.013574660633484, "percentage": 40.36, "elapsed_time": "3:04:50", "remaining_time": "4:33:06"}
|
| 248 |
{"current_steps": 223, "total_steps": 550, "loss": 0.3625, "lr": 5.9336851355382557e-05, "epoch": 2.02262443438914, "percentage": 40.55, "elapsed_time": "3:05:39", "remaining_time": "4:32:15"}
|
| 249 |
+
{"current_steps": 224, "total_steps": 550, "loss": 0.3565, "lr": 5.911423213238653e-05, "epoch": 2.0316742081447963, "percentage": 40.73, "elapsed_time": "3:06:29", "remaining_time": "4:31:24"}
|
| 250 |
+
{"current_steps": 225, "total_steps": 550, "loss": 0.3562, "lr": 5.889084299090732e-05, "epoch": 2.0407239819004523, "percentage": 40.91, "elapsed_time": "3:07:17", "remaining_time": "4:30:32"}
|
| 251 |
+
{"current_steps": 226, "total_steps": 550, "loss": 0.36, "lr": 5.866669292902695e-05, "epoch": 2.0497737556561084, "percentage": 41.09, "elapsed_time": "3:08:06", "remaining_time": "4:29:41"}
|
| 252 |
+
{"current_steps": 227, "total_steps": 550, "loss": 0.3602, "lr": 5.844179097547725e-05, "epoch": 2.0588235294117645, "percentage": 41.27, "elapsed_time": "3:08:55", "remaining_time": "4:28:49"}
|
| 253 |
+
{"current_steps": 228, "total_steps": 550, "loss": 0.3571, "lr": 5.821614618927613e-05, "epoch": 2.067873303167421, "percentage": 41.45, "elapsed_time": "3:09:44", "remaining_time": "4:27:57"}
|
| 254 |
+
{"current_steps": 229, "total_steps": 550, "loss": 0.3559, "lr": 5.798976765936264e-05, "epoch": 2.076923076923077, "percentage": 41.64, "elapsed_time": "3:10:32", "remaining_time": "4:27:05"}
|
| 255 |
+
{"current_steps": 230, "total_steps": 550, "loss": 0.355, "lr": 5.776266450423097e-05, "epoch": 2.085972850678733, "percentage": 41.82, "elapsed_time": "3:11:21", "remaining_time": "4:26:14"}
|
| 256 |
+
{"current_steps": 231, "total_steps": 550, "loss": 0.3595, "lr": 5.75348458715631e-05, "epoch": 2.0950226244343892, "percentage": 42.0, "elapsed_time": "3:12:10", "remaining_time": "4:25:22"}
|
| 257 |
+
{"current_steps": 232, "total_steps": 550, "loss": 0.352, "lr": 5.7306320937860336e-05, "epoch": 2.1040723981900453, "percentage": 42.18, "elapsed_time": "3:12:58", "remaining_time": "4:24:30"}
|
| 258 |
+
{"current_steps": 233, "total_steps": 550, "loss": 0.3582, "lr": 5.7077098908073676e-05, "epoch": 2.1131221719457014, "percentage": 42.36, "elapsed_time": "3:13:47", "remaining_time": "4:23:38"}
|
| 259 |
+
{"current_steps": 234, "total_steps": 550, "loss": 0.3533, "lr": 5.684718901523307e-05, "epoch": 2.1221719457013575, "percentage": 42.55, "elapsed_time": "3:14:35", "remaining_time": "4:22:47"}
|
| 260 |
+
{"current_steps": 235, "total_steps": 550, "loss": 0.3564, "lr": 5.661660052007547e-05, "epoch": 2.1312217194570136, "percentage": 42.73, "elapsed_time": "3:15:24", "remaining_time": "4:21:55"}
|
| 261 |
+
{"current_steps": 236, "total_steps": 550, "loss": 0.3518, "lr": 5.6385342710671815e-05, "epoch": 2.1402714932126696, "percentage": 42.91, "elapsed_time": "3:16:13", "remaining_time": "4:21:04"}
|
| 262 |
+
{"current_steps": 237, "total_steps": 550, "loss": 0.3535, "lr": 5.6153424902053e-05, "epoch": 2.1493212669683257, "percentage": 43.09, "elapsed_time": "3:17:01", "remaining_time": "4:20:12"}
|
| 263 |
+
{"current_steps": 238, "total_steps": 550, "loss": 0.3548, "lr": 5.59208564358345e-05, "epoch": 2.158371040723982, "percentage": 43.27, "elapsed_time": "3:17:49", "remaining_time": "4:19:20"}
|
| 264 |
+
{"current_steps": 239, "total_steps": 550, "loss": 0.3605, "lr": 5.568764667984022e-05, "epoch": 2.167420814479638, "percentage": 43.45, "elapsed_time": "3:18:38", "remaining_time": "4:18:29"}
|
| 265 |
+
{"current_steps": 240, "total_steps": 550, "loss": 0.3538, "lr": 5.5453805027725145e-05, "epoch": 2.176470588235294, "percentage": 43.64, "elapsed_time": "3:19:27", "remaining_time": "4:17:37"}
|
| 266 |
+
{"current_steps": 241, "total_steps": 550, "loss": 0.3497, "lr": 5.521934089859692e-05, "epoch": 2.1855203619909505, "percentage": 43.82, "elapsed_time": "3:20:15", "remaining_time": "4:16:45"}
|
| 267 |
+
{"current_steps": 242, "total_steps": 550, "loss": 0.355, "lr": 5.4984263736636494e-05, "epoch": 2.1945701357466065, "percentage": 44.0, "elapsed_time": "3:21:04", "remaining_time": "4:15:54"}
|
| 268 |
+
{"current_steps": 243, "total_steps": 550, "loss": 0.3557, "lr": 5.4748583010717636e-05, "epoch": 2.2036199095022626, "percentage": 44.18, "elapsed_time": "3:21:53", "remaining_time": "4:15:03"}
|
| 269 |
+
{"current_steps": 244, "total_steps": 550, "loss": 0.362, "lr": 5.451230821402564e-05, "epoch": 2.2126696832579187, "percentage": 44.36, "elapsed_time": "3:22:41", "remaining_time": "4:14:11"}
|
| 270 |
+
{"current_steps": 245, "total_steps": 550, "loss": 0.3519, "lr": 5.427544886367488e-05, "epoch": 2.2217194570135748, "percentage": 44.55, "elapsed_time": "3:23:30", "remaining_time": "4:13:20"}
|
| 271 |
+
{"current_steps": 246, "total_steps": 550, "loss": 0.3551, "lr": 5.403801450032544e-05, "epoch": 2.230769230769231, "percentage": 44.73, "elapsed_time": "3:24:19", "remaining_time": "4:12:29"}
|
| 272 |
+
{"current_steps": 247, "total_steps": 550, "loss": 0.359, "lr": 5.380001468779883e-05, "epoch": 2.239819004524887, "percentage": 44.91, "elapsed_time": "3:25:07", "remaining_time": "4:11:38"}
|
| 273 |
+
{"current_steps": 248, "total_steps": 550, "loss": 0.3569, "lr": 5.356145901269282e-05, "epoch": 2.248868778280543, "percentage": 45.09, "elapsed_time": "3:25:56", "remaining_time": "4:10:46"}
|
| 274 |
+
{"current_steps": 249, "total_steps": 550, "loss": 0.3584, "lr": 5.3322357083995235e-05, "epoch": 2.257918552036199, "percentage": 45.27, "elapsed_time": "3:26:45", "remaining_time": "4:09:55"}
|
| 275 |
+
{"current_steps": 250, "total_steps": 550, "loss": 0.3527, "lr": 5.3082718532696874e-05, "epoch": 2.266968325791855, "percentage": 45.45, "elapsed_time": "3:27:33", "remaining_time": "4:09:04"}
|
| 276 |
+
{"current_steps": 251, "total_steps": 550, "loss": 0.3508, "lr": 5.284255301140364e-05, "epoch": 2.276018099547511, "percentage": 45.64, "elapsed_time": "3:28:22", "remaining_time": "4:08:13"}
|
| 277 |
+
{"current_steps": 252, "total_steps": 550, "loss": 0.3486, "lr": 5.2601870193947716e-05, "epoch": 2.2850678733031673, "percentage": 45.82, "elapsed_time": "3:29:10", "remaining_time": "4:07:21"}
|
| 278 |
+
{"current_steps": 253, "total_steps": 550, "loss": 0.3521, "lr": 5.23606797749979e-05, "epoch": 2.2941176470588234, "percentage": 46.0, "elapsed_time": "3:29:59", "remaining_time": "4:06:30"}
|
| 279 |
+
{"current_steps": 254, "total_steps": 550, "loss": 0.3506, "lr": 5.21189914696691e-05, "epoch": 2.3031674208144794, "percentage": 46.18, "elapsed_time": "3:30:48", "remaining_time": "4:05:39"}
|
| 280 |
+
{"current_steps": 255, "total_steps": 550, "loss": 0.3511, "lr": 5.1876815013131e-05, "epoch": 2.3122171945701355, "percentage": 46.36, "elapsed_time": "3:31:36", "remaining_time": "4:04:48"}
|
| 281 |
+
{"current_steps": 256, "total_steps": 550, "loss": 0.3537, "lr": 5.163416016021597e-05, "epoch": 2.321266968325792, "percentage": 46.55, "elapsed_time": "3:32:25", "remaining_time": "4:03:57"}
|
| 282 |
+
{"current_steps": 257, "total_steps": 550, "loss": 0.3492, "lr": 5.1391036685026093e-05, "epoch": 2.330316742081448, "percentage": 46.73, "elapsed_time": "3:33:13", "remaining_time": "4:03:06"}
|
| 283 |
+
{"current_steps": 258, "total_steps": 550, "loss": 0.3522, "lr": 5.114745438053952e-05, "epoch": 2.339366515837104, "percentage": 46.91, "elapsed_time": "3:34:02", "remaining_time": "4:02:14"}
|
| 284 |
+
{"current_steps": 259, "total_steps": 550, "loss": 0.3531, "lr": 5.0903423058215925e-05, "epoch": 2.3484162895927603, "percentage": 47.09, "elapsed_time": "3:34:51", "remaining_time": "4:01:23"}
|
| 285 |
+
{"current_steps": 260, "total_steps": 550, "loss": 0.3509, "lr": 5.06589525476014e-05, "epoch": 2.3574660633484164, "percentage": 47.27, "elapsed_time": "3:35:39", "remaining_time": "4:00:32"}
|
| 286 |
+
{"current_steps": 261, "total_steps": 550, "loss": 0.3539, "lr": 5.0414052695932486e-05, "epoch": 2.3665158371040724, "percentage": 47.45, "elapsed_time": "3:36:28", "remaining_time": "3:59:41"}
|
| 287 |
+
{"current_steps": 262, "total_steps": 550, "loss": 0.3513, "lr": 5.016873336773949e-05, "epoch": 2.3755656108597285, "percentage": 47.64, "elapsed_time": "3:37:17", "remaining_time": "3:58:50"}
|
| 288 |
+
{"current_steps": 263, "total_steps": 550, "loss": 0.3569, "lr": 4.992300444444916e-05, "epoch": 2.3846153846153846, "percentage": 47.82, "elapsed_time": "3:38:05", "remaining_time": "3:57:59"}
|
| 289 |
+
{"current_steps": 264, "total_steps": 550, "loss": 0.3532, "lr": 4.967687582398671e-05, "epoch": 2.3936651583710407, "percentage": 48.0, "elapsed_time": "3:38:53", "remaining_time": "3:57:08"}
|
| 290 |
+
{"current_steps": 265, "total_steps": 550, "loss": 0.3546, "lr": 4.94303574203771e-05, "epoch": 2.4027149321266967, "percentage": 48.18, "elapsed_time": "3:39:42", "remaining_time": "3:56:17"}
|
| 291 |
+
{"current_steps": 266, "total_steps": 550, "loss": 0.3502, "lr": 4.9183459163345644e-05, "epoch": 2.411764705882353, "percentage": 48.36, "elapsed_time": "3:40:30", "remaining_time": "3:55:26"}
|
| 292 |
+
{"current_steps": 267, "total_steps": 550, "loss": 0.3522, "lr": 4.893619099791817e-05, "epoch": 2.420814479638009, "percentage": 48.55, "elapsed_time": "3:41:19", "remaining_time": "3:54:35"}
|
| 293 |
+
{"current_steps": 268, "total_steps": 550, "loss": 0.356, "lr": 4.868856288402032e-05, "epoch": 2.4298642533936654, "percentage": 48.73, "elapsed_time": "3:42:07", "remaining_time": "3:53:44"}
|
| 294 |
+
{"current_steps": 269, "total_steps": 550, "loss": 0.3534, "lr": 4.8440584796076395e-05, "epoch": 2.4389140271493215, "percentage": 48.91, "elapsed_time": "3:42:56", "remaining_time": "3:52:53"}
|
| 295 |
+
{"current_steps": 270, "total_steps": 550, "loss": 0.3592, "lr": 4.819226672260763e-05, "epoch": 2.4479638009049776, "percentage": 49.09, "elapsed_time": "3:43:45", "remaining_time": "3:52:02"}
|
| 296 |
+
{"current_steps": 271, "total_steps": 550, "loss": 0.3552, "lr": 4.794361866582982e-05, "epoch": 2.4570135746606336, "percentage": 49.27, "elapsed_time": "3:44:33", "remaining_time": "3:51:11"}
|
| 297 |
+
{"current_steps": 272, "total_steps": 550, "loss": 0.3531, "lr": 4.7694650641250446e-05, "epoch": 2.4660633484162897, "percentage": 49.45, "elapsed_time": "3:45:22", "remaining_time": "3:50:20"}
|
| 298 |
+
{"current_steps": 273, "total_steps": 550, "loss": 0.3554, "lr": 4.7445372677265205e-05, "epoch": 2.475113122171946, "percentage": 49.64, "elapsed_time": "3:46:10", "remaining_time": "3:49:29"}
|
| 299 |
+
{"current_steps": 274, "total_steps": 550, "loss": 0.3558, "lr": 4.719579481475416e-05, "epoch": 2.484162895927602, "percentage": 49.82, "elapsed_time": "3:46:59", "remaining_time": "3:48:38"}
|
| 300 |
+
{"current_steps": 275, "total_steps": 550, "loss": 0.3558, "lr": 4.694592710667723e-05, "epoch": 2.493212669683258, "percentage": 50.0, "elapsed_time": "3:47:48", "remaining_time": "3:47:48"}
|
| 301 |
+
{"current_steps": 276, "total_steps": 550, "loss": 0.355, "lr": 4.6695779617669236e-05, "epoch": 2.502262443438914, "percentage": 50.18, "elapsed_time": "3:48:37", "remaining_time": "3:46:57"}
|
| 302 |
+
{"current_steps": 277, "total_steps": 550, "loss": 0.3547, "lr": 4.6445362423634574e-05, "epoch": 2.51131221719457, "percentage": 50.36, "elapsed_time": "3:49:25", "remaining_time": "3:46:07"}
|
| 303 |
+
{"current_steps": 278, "total_steps": 550, "loss": 0.3524, "lr": 4.61946856113413e-05, "epoch": 2.520361990950226, "percentage": 50.55, "elapsed_time": "3:50:14", "remaining_time": "3:45:16"}
|
| 304 |
+
{"current_steps": 279, "total_steps": 550, "loss": 0.3518, "lr": 4.594375927801487e-05, "epoch": 2.5294117647058822, "percentage": 50.73, "elapsed_time": "3:51:03", "remaining_time": "3:44:25"}
|
| 305 |
+
{"current_steps": 280, "total_steps": 550, "loss": 0.3551, "lr": 4.5692593530931416e-05, "epoch": 2.5384615384615383, "percentage": 50.91, "elapsed_time": "3:51:52", "remaining_time": "3:43:35"}
|
| 306 |
+
{"current_steps": 281, "total_steps": 550, "loss": 0.3546, "lr": 4.5441198487010574e-05, "epoch": 2.5475113122171944, "percentage": 51.09, "elapsed_time": "3:52:40", "remaining_time": "3:42:44"}
|
| 307 |
+
{"current_steps": 282, "total_steps": 550, "loss": 0.3521, "lr": 4.5189584272408074e-05, "epoch": 2.5565610859728505, "percentage": 51.27, "elapsed_time": "3:53:29", "remaining_time": "3:41:54"}
|
| 308 |
+
{"current_steps": 283, "total_steps": 550, "loss": 0.351, "lr": 4.493776102210779e-05, "epoch": 2.5656108597285066, "percentage": 51.45, "elapsed_time": "3:54:18", "remaining_time": "3:41:03"}
|
| 309 |
+
{"current_steps": 284, "total_steps": 550, "loss": 0.352, "lr": 4.468573887951354e-05, "epoch": 2.5746606334841626, "percentage": 51.64, "elapsed_time": "3:55:06", "remaining_time": "3:40:12"}
|
| 310 |
+
{"current_steps": 285, "total_steps": 550, "loss": 0.3555, "lr": 4.4433527996040443e-05, "epoch": 2.583710407239819, "percentage": 51.82, "elapsed_time": "3:55:55", "remaining_time": "3:39:21"}
|
| 311 |
+
{"current_steps": 286, "total_steps": 550, "loss": 0.3534, "lr": 4.418113853070614e-05, "epoch": 2.5927601809954752, "percentage": 52.0, "elapsed_time": "3:56:43", "remaining_time": "3:38:31"}
|
| 312 |
+
{"current_steps": 287, "total_steps": 550, "loss": 0.3555, "lr": 4.392858064972149e-05, "epoch": 2.6018099547511313, "percentage": 52.18, "elapsed_time": "3:57:32", "remaining_time": "3:37:40"}
|
| 313 |
+
{"current_steps": 288, "total_steps": 550, "loss": 0.3522, "lr": 4.3675864526081106e-05, "epoch": 2.6108597285067874, "percentage": 52.36, "elapsed_time": "3:58:20", "remaining_time": "3:36:49"}
|
| 314 |
+
{"current_steps": 289, "total_steps": 550, "loss": 0.3529, "lr": 4.34230003391536e-05, "epoch": 2.6199095022624435, "percentage": 52.55, "elapsed_time": "3:59:08", "remaining_time": "3:35:58"}
|
| 315 |
+
{"current_steps": 290, "total_steps": 550, "loss": 0.3501, "lr": 4.316999827427154e-05, "epoch": 2.6289592760180995, "percentage": 52.73, "elapsed_time": "3:59:57", "remaining_time": "3:35:07"}
|
| 316 |
+
{"current_steps": 291, "total_steps": 550, "loss": 0.3593, "lr": 4.2916868522321235e-05, "epoch": 2.6380090497737556, "percentage": 52.91, "elapsed_time": "4:00:45", "remaining_time": "3:34:17"}
|
| 317 |
+
{"current_steps": 292, "total_steps": 550, "loss": 0.3542, "lr": 4.266362127933216e-05, "epoch": 2.6470588235294117, "percentage": 53.09, "elapsed_time": "4:01:33", "remaining_time": "3:33:26"}
|
| 318 |
+
{"current_steps": 293, "total_steps": 550, "loss": 0.3529, "lr": 4.2410266746066345e-05, "epoch": 2.6561085972850678, "percentage": 53.27, "elapsed_time": "4:02:22", "remaining_time": "3:32:35"}
|
| 319 |
+
{"current_steps": 294, "total_steps": 550, "loss": 0.3545, "lr": 4.215681512760744e-05, "epoch": 2.665158371040724, "percentage": 53.45, "elapsed_time": "4:03:10", "remaining_time": "3:31:44"}
|
| 320 |
+
{"current_steps": 295, "total_steps": 550, "loss": 0.3533, "lr": 4.19032766329497e-05, "epoch": 2.6742081447963804, "percentage": 53.64, "elapsed_time": "4:03:59", "remaining_time": "3:30:54"}
|
| 321 |
+
{"current_steps": 296, "total_steps": 550, "loss": 0.3543, "lr": 4.1649661474586694e-05, "epoch": 2.6832579185520364, "percentage": 53.82, "elapsed_time": "4:04:48", "remaining_time": "3:30:04"}
|
| 322 |
+
{"current_steps": 297, "total_steps": 550, "loss": 0.3569, "lr": 4.139597986810005e-05, "epoch": 2.6923076923076925, "percentage": 54.0, "elapsed_time": "4:05:36", "remaining_time": "3:29:13"}
|
| 323 |
+
{"current_steps": 298, "total_steps": 550, "loss": 0.3496, "lr": 4.114224203174785e-05, "epoch": 2.7013574660633486, "percentage": 54.18, "elapsed_time": "4:06:25", "remaining_time": "3:28:22"}
|
| 324 |
+
{"current_steps": 299, "total_steps": 550, "loss": 0.354, "lr": 4.0888458186053184e-05, "epoch": 2.7104072398190047, "percentage": 54.36, "elapsed_time": "4:07:13", "remaining_time": "3:27:32"}
|
| 325 |
+
{"current_steps": 300, "total_steps": 550, "loss": 0.3496, "lr": 4.063463855339232e-05, "epoch": 2.7194570135746607, "percentage": 54.55, "elapsed_time": "4:08:01", "remaining_time": "3:26:41"}
|
| 326 |
+
{"current_steps": 301, "total_steps": 550, "loss": 0.3491, "lr": 4.0380793357583076e-05, "epoch": 2.728506787330317, "percentage": 54.73, "elapsed_time": "4:08:50", "remaining_time": "3:25:51"}
|
| 327 |
+
{"current_steps": 302, "total_steps": 550, "loss": 0.3564, "lr": 4.012693282347289e-05, "epoch": 2.737556561085973, "percentage": 54.91, "elapsed_time": "4:09:39", "remaining_time": "3:25:00"}
|
| 328 |
+
{"current_steps": 303, "total_steps": 550, "loss": 0.3544, "lr": 3.9873067176527114e-05, "epoch": 2.746606334841629, "percentage": 55.09, "elapsed_time": "4:10:27", "remaining_time": "3:24:10"}
|
| 329 |
+
{"current_steps": 304, "total_steps": 550, "loss": 0.3546, "lr": 3.961920664241694e-05, "epoch": 2.755656108597285, "percentage": 55.27, "elapsed_time": "4:11:15", "remaining_time": "3:23:19"}
|
| 330 |
+
{"current_steps": 305, "total_steps": 550, "loss": 0.355, "lr": 3.9365361446607684e-05, "epoch": 2.764705882352941, "percentage": 55.45, "elapsed_time": "4:12:04", "remaining_time": "3:22:29"}
|
| 331 |
+
{"current_steps": 306, "total_steps": 550, "loss": 0.3564, "lr": 3.911154181394682e-05, "epoch": 2.773755656108597, "percentage": 55.64, "elapsed_time": "4:12:53", "remaining_time": "3:21:38"}
|
| 332 |
+
{"current_steps": 307, "total_steps": 550, "loss": 0.3548, "lr": 3.885775796825216e-05, "epoch": 2.7828054298642533, "percentage": 55.82, "elapsed_time": "4:13:41", "remaining_time": "3:20:48"}
|
| 333 |
+
{"current_steps": 308, "total_steps": 550, "loss": 0.3485, "lr": 3.860402013189998e-05, "epoch": 2.7918552036199094, "percentage": 56.0, "elapsed_time": "4:14:30", "remaining_time": "3:19:58"}
|
| 334 |
+
{"current_steps": 309, "total_steps": 550, "loss": 0.3562, "lr": 3.835033852541332e-05, "epoch": 2.8009049773755654, "percentage": 56.18, "elapsed_time": "4:15:19", "remaining_time": "3:19:07"}
|
| 335 |
+
{"current_steps": 310, "total_steps": 550, "loss": 0.348, "lr": 3.809672336705031e-05, "epoch": 2.8099547511312215, "percentage": 56.36, "elapsed_time": "4:16:07", "remaining_time": "3:18:17"}
|
| 336 |
+
{"current_steps": 311, "total_steps": 550, "loss": 0.3546, "lr": 3.784318487239257e-05, "epoch": 2.8190045248868776, "percentage": 56.55, "elapsed_time": "4:16:56", "remaining_time": "3:17:27"}
|
| 337 |
+
{"current_steps": 312, "total_steps": 550, "loss": 0.35, "lr": 3.758973325393367e-05, "epoch": 2.8280542986425337, "percentage": 56.73, "elapsed_time": "4:17:44", "remaining_time": "3:16:36"}
|
| 338 |
+
{"current_steps": 313, "total_steps": 550, "loss": 0.3537, "lr": 3.7336378720667846e-05, "epoch": 2.83710407239819, "percentage": 56.91, "elapsed_time": "4:18:33", "remaining_time": "3:15:46"}
|
| 339 |
+
{"current_steps": 314, "total_steps": 550, "loss": 0.3543, "lr": 3.708313147767878e-05, "epoch": 2.8461538461538463, "percentage": 57.09, "elapsed_time": "4:19:21", "remaining_time": "3:14:56"}
|
| 340 |
+
{"current_steps": 315, "total_steps": 550, "loss": 0.3544, "lr": 3.683000172572846e-05, "epoch": 2.8552036199095023, "percentage": 57.27, "elapsed_time": "4:20:10", "remaining_time": "3:14:05"}
|
| 341 |
+
{"current_steps": 316, "total_steps": 550, "loss": 0.3531, "lr": 3.657699966084642e-05, "epoch": 2.8642533936651584, "percentage": 57.45, "elapsed_time": "4:20:58", "remaining_time": "3:13:15"}
|
| 342 |
+
{"current_steps": 317, "total_steps": 550, "loss": 0.3556, "lr": 3.632413547391891e-05, "epoch": 2.8733031674208145, "percentage": 57.64, "elapsed_time": "4:21:47", "remaining_time": "3:12:25"}
|
| 343 |
+
{"current_steps": 318, "total_steps": 550, "loss": 0.3471, "lr": 3.6071419350278515e-05, "epoch": 2.8823529411764706, "percentage": 57.82, "elapsed_time": "4:22:35", "remaining_time": "3:11:34"}
|
| 344 |
+
{"current_steps": 319, "total_steps": 550, "loss": 0.3451, "lr": 3.581886146929387e-05, "epoch": 2.8914027149321266, "percentage": 58.0, "elapsed_time": "4:23:24", "remaining_time": "3:10:44"}
|
| 345 |
+
{"current_steps": 320, "total_steps": 550, "loss": 0.352, "lr": 3.556647200395956e-05, "epoch": 2.9004524886877827, "percentage": 58.18, "elapsed_time": "4:24:12", "remaining_time": "3:09:54"}
|
| 346 |
+
{"current_steps": 321, "total_steps": 550, "loss": 0.3493, "lr": 3.5314261120486474e-05, "epoch": 2.909502262443439, "percentage": 58.36, "elapsed_time": "4:25:01", "remaining_time": "3:09:03"}
|
| 347 |
+
{"current_steps": 322, "total_steps": 550, "loss": 0.3508, "lr": 3.5062238977892214e-05, "epoch": 2.918552036199095, "percentage": 58.55, "elapsed_time": "4:25:49", "remaining_time": "3:08:13"}
|
| 348 |
+
{"current_steps": 323, "total_steps": 550, "loss": 0.355, "lr": 3.481041572759193e-05, "epoch": 2.9276018099547514, "percentage": 58.73, "elapsed_time": "4:26:38", "remaining_time": "3:07:23"}
|
| 349 |
+
{"current_steps": 324, "total_steps": 550, "loss": 0.354, "lr": 3.4558801512989446e-05, "epoch": 2.9366515837104075, "percentage": 58.91, "elapsed_time": "4:27:26", "remaining_time": "3:06:33"}
|
| 350 |
+
{"current_steps": 325, "total_steps": 550, "loss": 0.3542, "lr": 3.4307406469068604e-05, "epoch": 2.9457013574660635, "percentage": 59.09, "elapsed_time": "4:28:15", "remaining_time": "3:05:43"}
|
| 351 |
+
{"current_steps": 326, "total_steps": 550, "loss": 0.3553, "lr": 3.405624072198514e-05, "epoch": 2.9547511312217196, "percentage": 59.27, "elapsed_time": "4:29:04", "remaining_time": "3:04:52"}
|
| 352 |
+
{"current_steps": 327, "total_steps": 550, "loss": 0.3507, "lr": 3.3805314388658714e-05, "epoch": 2.9638009049773757, "percentage": 59.45, "elapsed_time": "4:29:52", "remaining_time": "3:04:02"}
|
| 353 |
+
{"current_steps": 328, "total_steps": 550, "loss": 0.3469, "lr": 3.3554637576365446e-05, "epoch": 2.9728506787330318, "percentage": 59.64, "elapsed_time": "4:30:41", "remaining_time": "3:03:12"}
|
| 354 |
+
{"current_steps": 329, "total_steps": 550, "loss": 0.3499, "lr": 3.330422038233078e-05, "epoch": 2.981900452488688, "percentage": 59.82, "elapsed_time": "4:31:29", "remaining_time": "3:02:22"}
|
| 355 |
+
{"current_steps": 330, "total_steps": 550, "loss": 0.3475, "lr": 3.305407289332279e-05, "epoch": 2.990950226244344, "percentage": 60.0, "elapsed_time": "4:32:18", "remaining_time": "3:01:32"}
|
| 356 |
+
{"current_steps": 331, "total_steps": 550, "loss": 0.3429, "lr": 3.280420518524585e-05, "epoch": 3.002262443438914, "percentage": 60.18, "elapsed_time": "4:35:08", "remaining_time": "3:02:02"}
|
| 357 |
+
{"current_steps": 332, "total_steps": 550, "loss": 0.3276, "lr": 3.25546273227348e-05, "epoch": 3.01131221719457, "percentage": 60.36, "elapsed_time": "4:35:56", "remaining_time": "3:01:11"}
|
| 358 |
+
{"current_steps": 333, "total_steps": 550, "loss": 0.322, "lr": 3.230534935874958e-05, "epoch": 3.020361990950226, "percentage": 60.55, "elapsed_time": "4:36:44", "remaining_time": "3:00:20"}
|
| 359 |
+
{"current_steps": 334, "total_steps": 550, "loss": 0.3247, "lr": 3.205638133417019e-05, "epoch": 3.0294117647058822, "percentage": 60.73, "elapsed_time": "4:37:33", "remaining_time": "2:59:29"}
|