Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:810877517c86e89ac518723730218c5cafdad7b49ef14224b52ca929491b930e
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e13efec1d6c317d51e4467636d240f3f02e9ed66d4a165f3a9cac305a000787e
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:81e0d4db0bf04fa51c20dce007113d391b739aeffdc04cc9e4f23167d645c965
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7abe1929987bf5c812cc0b3297fc8a53a2c8cd565031ec482bd36ff899005fc7
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -260,3 +260,133 @@
|
|
| 260 |
{"current_steps": 260, "total_steps": 650, "loss": 0.4242, "lr": 3.0000000000000004e-05, "epoch": 1.9928195308760173, "percentage": 40.0, "elapsed_time": "7:34:33", "remaining_time": "11:21:50"}
|
| 261 |
{"current_steps": 261, "total_steps": 650, "loss": 0.6896, "lr": 2.990684089782507e-05, "epoch": 2.0019147917663953, "percentage": 40.15, "elapsed_time": "7:37:12", "remaining_time": "11:21:26"}
|
| 262 |
{"current_steps": 262, "total_steps": 650, "loss": 0.3589, "lr": 2.9813396087810134e-05, "epoch": 2.009573958831977, "percentage": 40.31, "elapsed_time": "7:38:51", "remaining_time": "11:19:32"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 260 |
{"current_steps": 260, "total_steps": 650, "loss": 0.4242, "lr": 3.0000000000000004e-05, "epoch": 1.9928195308760173, "percentage": 40.0, "elapsed_time": "7:34:33", "remaining_time": "11:21:50"}
|
| 261 |
{"current_steps": 261, "total_steps": 650, "loss": 0.6896, "lr": 2.990684089782507e-05, "epoch": 2.0019147917663953, "percentage": 40.15, "elapsed_time": "7:37:12", "remaining_time": "11:21:26"}
|
| 262 |
{"current_steps": 262, "total_steps": 650, "loss": 0.3589, "lr": 2.9813396087810134e-05, "epoch": 2.009573958831977, "percentage": 40.31, "elapsed_time": "7:38:51", "remaining_time": "11:19:32"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 650, "loss": 0.3823, "lr": 2.971966826485212e-05, "epoch": 2.0172331258975587, "percentage": 40.46, "elapsed_time": "7:40:36", "remaining_time": "11:17:47"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 650, "loss": 0.3751, "lr": 2.962566013200986e-05, "epoch": 2.0248922929631403, "percentage": 40.62, "elapsed_time": "7:42:25", "remaining_time": "11:16:07"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 650, "loss": 0.3232, "lr": 2.9531374400426158e-05, "epoch": 2.032551460028722, "percentage": 40.77, "elapsed_time": "7:44:17", "remaining_time": "11:14:32"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 650, "loss": 0.3447, "lr": 2.943681378924964e-05, "epoch": 2.0402106270943037, "percentage": 40.92, "elapsed_time": "7:46:06", "remaining_time": "11:12:52"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 650, "loss": 0.3502, "lr": 2.934198102555631e-05, "epoch": 2.047869794159885, "percentage": 41.08, "elapsed_time": "7:47:58", "remaining_time": "11:11:16"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 650, "loss": 0.3328, "lr": 2.924687884427087e-05, "epoch": 2.0555289612254666, "percentage": 41.23, "elapsed_time": "7:49:56", "remaining_time": "11:09:50"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 650, "loss": 0.323, "lr": 2.9151509988087912e-05, "epoch": 2.0631881282910483, "percentage": 41.38, "elapsed_time": "7:51:32", "remaining_time": "11:07:51"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 650, "loss": 0.3314, "lr": 2.9055877207392752e-05, "epoch": 2.07084729535663, "percentage": 41.54, "elapsed_time": "7:52:58", "remaining_time": "11:05:40"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 650, "loss": 0.3433, "lr": 2.8959983260182166e-05, "epoch": 2.0785064624222116, "percentage": 41.69, "elapsed_time": "7:54:44", "remaining_time": "11:03:56"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 650, "loss": 0.3174, "lr": 2.886383091198483e-05, "epoch": 2.0861656294877933, "percentage": 41.85, "elapsed_time": "7:56:15", "remaining_time": "11:01:51"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 650, "loss": 0.4027, "lr": 2.876742293578155e-05, "epoch": 2.093824796553375, "percentage": 42.0, "elapsed_time": "7:58:02", "remaining_time": "11:00:08"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 650, "loss": 0.3762, "lr": 2.8670762111925313e-05, "epoch": 2.1014839636189566, "percentage": 42.15, "elapsed_time": "7:59:39", "remaining_time": "10:58:12"}
|
| 275 |
+
{"current_steps": 275, "total_steps": 650, "loss": 0.3116, "lr": 2.8573851228061084e-05, "epoch": 2.109143130684538, "percentage": 42.31, "elapsed_time": "8:01:19", "remaining_time": "10:56:21"}
|
| 276 |
+
{"current_steps": 276, "total_steps": 650, "loss": 0.3379, "lr": 2.8476693079045432e-05, "epoch": 2.1168022977501195, "percentage": 42.46, "elapsed_time": "8:03:18", "remaining_time": "10:54:55"}
|
| 277 |
+
{"current_steps": 277, "total_steps": 650, "loss": 0.3305, "lr": 2.8379290466865906e-05, "epoch": 2.124461464815701, "percentage": 42.62, "elapsed_time": "8:04:56", "remaining_time": "10:52:59"}
|
| 278 |
+
{"current_steps": 278, "total_steps": 650, "loss": 0.3598, "lr": 2.828164620056024e-05, "epoch": 2.132120631881283, "percentage": 42.77, "elapsed_time": "8:06:32", "remaining_time": "10:51:03"}
|
| 279 |
+
{"current_steps": 279, "total_steps": 650, "loss": 0.302, "lr": 2.818376309613535e-05, "epoch": 2.1397797989468645, "percentage": 42.92, "elapsed_time": "8:08:15", "remaining_time": "10:49:15"}
|
| 280 |
+
{"current_steps": 280, "total_steps": 650, "loss": 0.3686, "lr": 2.80856439764861e-05, "epoch": 2.147438966012446, "percentage": 43.08, "elapsed_time": "8:09:59", "remaining_time": "10:47:29"}
|
| 281 |
+
{"current_steps": 281, "total_steps": 650, "loss": 0.3526, "lr": 2.798729167131391e-05, "epoch": 2.155098133078028, "percentage": 43.23, "elapsed_time": "8:11:28", "remaining_time": "10:45:22"}
|
| 282 |
+
{"current_steps": 282, "total_steps": 650, "loss": 0.3326, "lr": 2.7888709017045146e-05, "epoch": 2.1627573001436096, "percentage": 43.38, "elapsed_time": "8:13:22", "remaining_time": "10:43:49"}
|
| 283 |
+
{"current_steps": 283, "total_steps": 650, "loss": 0.3342, "lr": 2.7789898856749297e-05, "epoch": 2.170416467209191, "percentage": 43.54, "elapsed_time": "8:15:14", "remaining_time": "10:42:14"}
|
| 284 |
+
{"current_steps": 284, "total_steps": 650, "loss": 0.3051, "lr": 2.7690864040057023e-05, "epoch": 2.1780756342747725, "percentage": 43.69, "elapsed_time": "8:16:39", "remaining_time": "10:40:03"}
|
| 285 |
+
{"current_steps": 285, "total_steps": 650, "loss": 0.3087, "lr": 2.7591607423077932e-05, "epoch": 2.185734801340354, "percentage": 43.85, "elapsed_time": "8:18:14", "remaining_time": "10:38:06"}
|
| 286 |
+
{"current_steps": 286, "total_steps": 650, "loss": 0.3503, "lr": 2.7492131868318247e-05, "epoch": 2.193393968405936, "percentage": 44.0, "elapsed_time": "8:20:09", "remaining_time": "10:36:33"}
|
| 287 |
+
{"current_steps": 287, "total_steps": 650, "loss": 0.3654, "lr": 2.739244024459822e-05, "epoch": 2.2010531354715175, "percentage": 44.15, "elapsed_time": "8:22:04", "remaining_time": "10:35:01"}
|
| 288 |
+
{"current_steps": 288, "total_steps": 650, "loss": 0.3149, "lr": 2.7292535426969436e-05, "epoch": 2.208712302537099, "percentage": 44.31, "elapsed_time": "8:23:54", "remaining_time": "10:33:23"}
|
| 289 |
+
{"current_steps": 289, "total_steps": 650, "loss": 0.3911, "lr": 2.7192420296631835e-05, "epoch": 2.216371469602681, "percentage": 44.46, "elapsed_time": "8:25:44", "remaining_time": "10:31:43"}
|
| 290 |
+
{"current_steps": 290, "total_steps": 650, "loss": 0.3068, "lr": 2.7092097740850712e-05, "epoch": 2.2240306366682625, "percentage": 44.62, "elapsed_time": "8:27:13", "remaining_time": "10:29:39"}
|
| 291 |
+
{"current_steps": 291, "total_steps": 650, "loss": 0.3681, "lr": 2.6991570652873357e-05, "epoch": 2.231689803733844, "percentage": 44.77, "elapsed_time": "8:29:08", "remaining_time": "10:28:07"}
|
| 292 |
+
{"current_steps": 292, "total_steps": 650, "loss": 0.3022, "lr": 2.6890841931845674e-05, "epoch": 2.2393489707994254, "percentage": 44.92, "elapsed_time": "8:30:31", "remaining_time": "10:25:55"}
|
| 293 |
+
{"current_steps": 293, "total_steps": 650, "loss": 0.359, "lr": 2.6789914482728546e-05, "epoch": 2.247008137865007, "percentage": 45.08, "elapsed_time": "8:32:17", "remaining_time": "10:24:11"}
|
| 294 |
+
{"current_steps": 294, "total_steps": 650, "loss": 0.3693, "lr": 2.6688791216214064e-05, "epoch": 2.2546673049305888, "percentage": 45.23, "elapsed_time": "8:34:16", "remaining_time": "10:22:43"}
|
| 295 |
+
{"current_steps": 295, "total_steps": 650, "loss": 0.32, "lr": 2.6587475048641596e-05, "epoch": 2.2623264719961704, "percentage": 45.38, "elapsed_time": "8:35:44", "remaining_time": "10:20:38"}
|
| 296 |
+
{"current_steps": 296, "total_steps": 650, "loss": 0.3726, "lr": 2.6485968901913658e-05, "epoch": 2.269985639061752, "percentage": 45.54, "elapsed_time": "8:37:26", "remaining_time": "10:18:49"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 650, "loss": 0.3584, "lr": 2.6384275703411666e-05, "epoch": 2.2776448061273338, "percentage": 45.69, "elapsed_time": "8:38:58", "remaining_time": "10:16:49"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 650, "loss": 0.3263, "lr": 2.6282398385911503e-05, "epoch": 2.2853039731929154, "percentage": 45.85, "elapsed_time": "8:40:36", "remaining_time": "10:14:56"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 650, "loss": 0.3854, "lr": 2.618033988749895e-05, "epoch": 2.2929631402584967, "percentage": 46.0, "elapsed_time": "8:42:49", "remaining_time": "10:13:45"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 650, "loss": 0.3445, "lr": 2.607810315148494e-05, "epoch": 2.3006223073240784, "percentage": 46.15, "elapsed_time": "8:44:26", "remaining_time": "10:11:51"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 650, "loss": 0.3486, "lr": 2.5975691126320678e-05, "epoch": 2.30828147438966, "percentage": 46.31, "elapsed_time": "8:46:13", "remaining_time": "10:10:08"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 650, "loss": 0.3478, "lr": 2.587310676551262e-05, "epoch": 2.3159406414552417, "percentage": 46.46, "elapsed_time": "8:47:44", "remaining_time": "10:08:07"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 650, "loss": 0.3494, "lr": 2.5770353027537276e-05, "epoch": 2.3235998085208234, "percentage": 46.62, "elapsed_time": "8:49:35", "remaining_time": "10:06:30"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 650, "loss": 0.3267, "lr": 2.5667432875755904e-05, "epoch": 2.331258975586405, "percentage": 46.77, "elapsed_time": "8:51:10", "remaining_time": "10:04:33"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 650, "loss": 0.3246, "lr": 2.5564349278329056e-05, "epoch": 2.3389181426519867, "percentage": 46.92, "elapsed_time": "8:52:44", "remaining_time": "10:02:36"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 650, "loss": 0.2918, "lr": 2.5461105208130953e-05, "epoch": 2.3465773097175684, "percentage": 47.08, "elapsed_time": "8:54:12", "remaining_time": "10:00:32"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 650, "loss": 0.357, "lr": 2.5357703642663766e-05, "epoch": 2.35423647678315, "percentage": 47.23, "elapsed_time": "8:55:59", "remaining_time": "9:58:50"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 650, "loss": 0.3287, "lr": 2.525414756397174e-05, "epoch": 2.3618956438487313, "percentage": 47.38, "elapsed_time": "8:57:37", "remaining_time": "9:56:58"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 650, "loss": 0.323, "lr": 2.5150439958555205e-05, "epoch": 2.369554810914313, "percentage": 47.54, "elapsed_time": "8:59:17", "remaining_time": "9:55:08"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 650, "loss": 0.3641, "lr": 2.5046583817284437e-05, "epoch": 2.3772139779798946, "percentage": 47.69, "elapsed_time": "9:00:57", "remaining_time": "9:53:18"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 650, "loss": 0.3553, "lr": 2.4942582135313393e-05, "epoch": 2.3848731450454763, "percentage": 47.85, "elapsed_time": "9:02:44", "remaining_time": "9:51:36"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 650, "loss": 0.3455, "lr": 2.4838437911993355e-05, "epoch": 2.392532312111058, "percentage": 48.0, "elapsed_time": "9:04:44", "remaining_time": "9:50:08"}
|
| 313 |
+
{"current_steps": 313, "total_steps": 650, "loss": 0.3619, "lr": 2.473415415078642e-05, "epoch": 2.4001914791766397, "percentage": 48.15, "elapsed_time": "9:06:40", "remaining_time": "9:48:35"}
|
| 314 |
+
{"current_steps": 314, "total_steps": 650, "loss": 0.3485, "lr": 2.4629733859178867e-05, "epoch": 2.4078506462422213, "percentage": 48.31, "elapsed_time": "9:08:20", "remaining_time": "9:46:45"}
|
| 315 |
+
{"current_steps": 315, "total_steps": 650, "loss": 0.3057, "lr": 2.4525180048594452e-05, "epoch": 2.4155098133078026, "percentage": 48.46, "elapsed_time": "9:10:04", "remaining_time": "9:45:00"}
|
| 316 |
+
{"current_steps": 316, "total_steps": 650, "loss": 0.3747, "lr": 2.4420495734307527e-05, "epoch": 2.4231689803733842, "percentage": 48.62, "elapsed_time": "9:11:58", "remaining_time": "9:43:24"}
|
| 317 |
+
{"current_steps": 317, "total_steps": 650, "loss": 0.3475, "lr": 2.4315683935356127e-05, "epoch": 2.430828147438966, "percentage": 48.77, "elapsed_time": "9:13:44", "remaining_time": "9:41:41"}
|
| 318 |
+
{"current_steps": 318, "total_steps": 650, "loss": 0.303, "lr": 2.421074767445485e-05, "epoch": 2.4384873145045476, "percentage": 48.92, "elapsed_time": "9:15:26", "remaining_time": "9:39:53"}
|
| 319 |
+
{"current_steps": 319, "total_steps": 650, "loss": 0.3979, "lr": 2.4105689977907722e-05, "epoch": 2.4461464815701293, "percentage": 49.08, "elapsed_time": "9:17:24", "remaining_time": "9:38:22"}
|
| 320 |
+
{"current_steps": 320, "total_steps": 650, "loss": 0.3407, "lr": 2.4000513875520892e-05, "epoch": 2.453805648635711, "percentage": 49.23, "elapsed_time": "9:19:04", "remaining_time": "9:36:32"}
|
| 321 |
+
{"current_steps": 321, "total_steps": 650, "loss": 0.3425, "lr": 2.3895222400515282e-05, "epoch": 2.4614648157012926, "percentage": 49.38, "elapsed_time": "9:20:34", "remaining_time": "9:34:33"}
|
| 322 |
+
{"current_steps": 322, "total_steps": 650, "loss": 0.3098, "lr": 2.3789818589439094e-05, "epoch": 2.4691239827668743, "percentage": 49.54, "elapsed_time": "9:22:23", "remaining_time": "9:32:52"}
|
| 323 |
+
{"current_steps": 323, "total_steps": 650, "loss": 0.3591, "lr": 2.3684305482080233e-05, "epoch": 2.476783149832456, "percentage": 49.69, "elapsed_time": "9:24:25", "remaining_time": "9:31:24"}
|
| 324 |
+
{"current_steps": 324, "total_steps": 650, "loss": 0.3773, "lr": 2.357868612137866e-05, "epoch": 2.484442316898037, "percentage": 49.85, "elapsed_time": "9:26:04", "remaining_time": "9:29:34"}
|
| 325 |
+
{"current_steps": 325, "total_steps": 650, "loss": 0.3228, "lr": 2.3472963553338614e-05, "epoch": 2.492101483963619, "percentage": 50.0, "elapsed_time": "9:27:51", "remaining_time": "9:27:51"}
|
| 326 |
+
{"current_steps": 326, "total_steps": 650, "loss": 0.3546, "lr": 2.3367140826940768e-05, "epoch": 2.4997606510292005, "percentage": 50.15, "elapsed_time": "9:29:33", "remaining_time": "9:26:03"}
|
| 327 |
+
{"current_steps": 327, "total_steps": 650, "loss": 0.3375, "lr": 2.326122099405435e-05, "epoch": 2.507419818094782, "percentage": 50.31, "elapsed_time": "9:31:36", "remaining_time": "9:24:36"}
|
| 328 |
+
{"current_steps": 328, "total_steps": 650, "loss": 0.3687, "lr": 2.315520710934903e-05, "epoch": 2.515078985160364, "percentage": 50.46, "elapsed_time": "9:33:24", "remaining_time": "9:22:55"}
|
| 329 |
+
{"current_steps": 329, "total_steps": 650, "loss": 0.3548, "lr": 2.304910223020691e-05, "epoch": 2.5227381522259456, "percentage": 50.62, "elapsed_time": "9:35:12", "remaining_time": "9:21:13"}
|
| 330 |
+
{"current_steps": 330, "total_steps": 650, "loss": 0.3446, "lr": 2.2942909416634326e-05, "epoch": 2.5303973192915272, "percentage": 50.77, "elapsed_time": "9:37:02", "remaining_time": "9:19:33"}
|
| 331 |
+
{"current_steps": 331, "total_steps": 650, "loss": 0.3281, "lr": 2.2836631731173577e-05, "epoch": 2.5380564863571085, "percentage": 50.92, "elapsed_time": "9:38:54", "remaining_time": "9:17:55"}
|
| 332 |
+
{"current_steps": 332, "total_steps": 650, "loss": 0.3479, "lr": 2.2730272238814636e-05, "epoch": 2.54571565342269, "percentage": 51.08, "elapsed_time": "9:40:26", "remaining_time": "9:15:57"}
|
| 333 |
+
{"current_steps": 333, "total_steps": 650, "loss": 0.3468, "lr": 2.2623834006906732e-05, "epoch": 2.553374820488272, "percentage": 51.23, "elapsed_time": "9:42:07", "remaining_time": "9:14:09"}
|
| 334 |
+
{"current_steps": 334, "total_steps": 650, "loss": 0.311, "lr": 2.25173201050699e-05, "epoch": 2.5610339875538535, "percentage": 51.38, "elapsed_time": "9:43:38", "remaining_time": "9:12:11"}
|
| 335 |
+
{"current_steps": 335, "total_steps": 650, "loss": 0.3803, "lr": 2.2410733605106462e-05, "epoch": 2.568693154619435, "percentage": 51.54, "elapsed_time": "9:45:31", "remaining_time": "9:10:34"}
|
| 336 |
+
{"current_steps": 336, "total_steps": 650, "loss": 0.2936, "lr": 2.2304077580912423e-05, "epoch": 2.576352321685017, "percentage": 51.69, "elapsed_time": "9:47:13", "remaining_time": "9:08:46"}
|
| 337 |
+
{"current_steps": 337, "total_steps": 650, "loss": 0.3184, "lr": 2.2197355108388835e-05, "epoch": 2.5840114887505985, "percentage": 51.85, "elapsed_time": "9:48:50", "remaining_time": "9:06:54"}
|
| 338 |
+
{"current_steps": 338, "total_steps": 650, "loss": 0.3287, "lr": 2.209056926535307e-05, "epoch": 2.5916706558161797, "percentage": 52.0, "elapsed_time": "9:50:42", "remaining_time": "9:05:16"}
|
| 339 |
+
{"current_steps": 339, "total_steps": 650, "loss": 0.3683, "lr": 2.1983723131450088e-05, "epoch": 2.599329822881762, "percentage": 52.15, "elapsed_time": "9:52:40", "remaining_time": "9:03:43"}
|
| 340 |
+
{"current_steps": 340, "total_steps": 650, "loss": 0.3086, "lr": 2.1876819788063586e-05, "epoch": 2.606988989947343, "percentage": 52.31, "elapsed_time": "9:54:21", "remaining_time": "9:01:54"}
|
| 341 |
+
{"current_steps": 341, "total_steps": 650, "loss": 0.375, "lr": 2.176986231822717e-05, "epoch": 2.6146481570129247, "percentage": 52.46, "elapsed_time": "9:56:07", "remaining_time": "9:00:10"}
|
| 342 |
+
{"current_steps": 342, "total_steps": 650, "loss": 0.3432, "lr": 2.166285380653541e-05, "epoch": 2.6223073240785064, "percentage": 52.62, "elapsed_time": "9:58:02", "remaining_time": "8:58:34"}
|
| 343 |
+
{"current_steps": 343, "total_steps": 650, "loss": 0.3207, "lr": 2.1555797339054898e-05, "epoch": 2.629966491144088, "percentage": 52.77, "elapsed_time": "9:59:55", "remaining_time": "8:56:57"}
|
| 344 |
+
{"current_steps": 344, "total_steps": 650, "loss": 0.3586, "lr": 2.1448696003235252e-05, "epoch": 2.6376256582096698, "percentage": 52.92, "elapsed_time": "10:01:49", "remaining_time": "8:55:20"}
|
| 345 |
+
{"current_steps": 345, "total_steps": 650, "loss": 0.3419, "lr": 2.1341552887820048e-05, "epoch": 2.6452848252752514, "percentage": 53.08, "elapsed_time": "10:03:14", "remaining_time": "8:53:18"}
|
| 346 |
+
{"current_steps": 346, "total_steps": 650, "loss": 0.3605, "lr": 2.123437108275779e-05, "epoch": 2.652943992340833, "percentage": 53.23, "elapsed_time": "10:04:58", "remaining_time": "8:51:32"}
|
| 347 |
+
{"current_steps": 347, "total_steps": 650, "loss": 0.3102, "lr": 2.112715367911275e-05, "epoch": 2.6606031594064143, "percentage": 53.38, "elapsed_time": "10:06:16", "remaining_time": "8:49:24"}
|
| 348 |
+
{"current_steps": 348, "total_steps": 650, "loss": 0.3645, "lr": 2.1019903768975852e-05, "epoch": 2.668262326471996, "percentage": 53.54, "elapsed_time": "10:08:03", "remaining_time": "8:47:40"}
|
| 349 |
+
{"current_steps": 349, "total_steps": 650, "loss": 0.3641, "lr": 2.0912624445375483e-05, "epoch": 2.6759214935375777, "percentage": 53.69, "elapsed_time": "10:09:39", "remaining_time": "8:45:48"}
|
| 350 |
+
{"current_steps": 350, "total_steps": 650, "loss": 0.3233, "lr": 2.0805318802188307e-05, "epoch": 2.6835806606031594, "percentage": 53.85, "elapsed_time": "10:11:43", "remaining_time": "8:44:19"}
|
| 351 |
+
{"current_steps": 351, "total_steps": 650, "loss": 0.3492, "lr": 2.0697989934050025e-05, "epoch": 2.691239827668741, "percentage": 54.0, "elapsed_time": "10:13:18", "remaining_time": "8:42:26"}
|
| 352 |
+
{"current_steps": 352, "total_steps": 650, "loss": 0.3492, "lr": 2.0590640936266132e-05, "epoch": 2.6988989947343227, "percentage": 54.15, "elapsed_time": "10:14:53", "remaining_time": "8:40:33"}
|
| 353 |
+
{"current_steps": 353, "total_steps": 650, "loss": 0.3478, "lr": 2.0483274904722647e-05, "epoch": 2.7065581617999044, "percentage": 54.31, "elapsed_time": "10:16:46", "remaining_time": "8:38:56"}
|
| 354 |
+
{"current_steps": 354, "total_steps": 650, "loss": 0.3553, "lr": 2.037589493579685e-05, "epoch": 2.7142173288654856, "percentage": 54.46, "elapsed_time": "10:18:35", "remaining_time": "8:37:14"}
|
| 355 |
+
{"current_steps": 355, "total_steps": 650, "loss": 0.3653, "lr": 2.0268504126267952e-05, "epoch": 2.7218764959310677, "percentage": 54.62, "elapsed_time": "10:20:20", "remaining_time": "8:35:29"}
|
| 356 |
+
{"current_steps": 356, "total_steps": 650, "loss": 0.36, "lr": 2.0161105573227798e-05, "epoch": 2.729535662996649, "percentage": 54.77, "elapsed_time": "10:22:05", "remaining_time": "8:33:44"}
|
| 357 |
+
{"current_steps": 357, "total_steps": 650, "loss": 0.3515, "lr": 2.005370237399157e-05, "epoch": 2.7371948300622306, "percentage": 54.92, "elapsed_time": "10:23:46", "remaining_time": "8:31:57"}
|
| 358 |
+
{"current_steps": 358, "total_steps": 650, "loss": 0.2689, "lr": 1.9946297626008432e-05, "epoch": 2.7448539971278123, "percentage": 55.08, "elapsed_time": "10:24:57", "remaining_time": "8:29:44"}
|
| 359 |
+
{"current_steps": 359, "total_steps": 650, "loss": 0.3706, "lr": 1.9838894426772205e-05, "epoch": 2.752513164193394, "percentage": 55.23, "elapsed_time": "10:26:35", "remaining_time": "8:27:54"}
|
| 360 |
+
{"current_steps": 360, "total_steps": 650, "loss": 0.3135, "lr": 1.9731495873732055e-05, "epoch": 2.7601723312589757, "percentage": 55.38, "elapsed_time": "10:28:37", "remaining_time": "8:26:23"}
|
| 361 |
+
{"current_steps": 361, "total_steps": 650, "loss": 0.3576, "lr": 1.9624105064203157e-05, "epoch": 2.7678314983245573, "percentage": 55.54, "elapsed_time": "10:30:47", "remaining_time": "8:24:58"}
|
| 362 |
+
{"current_steps": 362, "total_steps": 650, "loss": 0.3321, "lr": 1.951672509527736e-05, "epoch": 2.775490665390139, "percentage": 55.69, "elapsed_time": "10:32:41", "remaining_time": "8:23:21"}
|
| 363 |
+
{"current_steps": 363, "total_steps": 650, "loss": 0.3715, "lr": 1.940935906373388e-05, "epoch": 2.7831498324557202, "percentage": 55.85, "elapsed_time": "10:34:27", "remaining_time": "8:21:37"}
|
| 364 |
+
{"current_steps": 364, "total_steps": 650, "loss": 0.3412, "lr": 1.930201006594999e-05, "epoch": 2.790808999521302, "percentage": 56.0, "elapsed_time": "10:36:14", "remaining_time": "8:19:54"}
|
| 365 |
+
{"current_steps": 365, "total_steps": 650, "loss": 0.3849, "lr": 1.9194681197811703e-05, "epoch": 2.7984681665868836, "percentage": 56.15, "elapsed_time": "10:38:06", "remaining_time": "8:18:14"}
|
| 366 |
+
{"current_steps": 366, "total_steps": 650, "loss": 0.3072, "lr": 1.9087375554624527e-05, "epoch": 2.8061273336524652, "percentage": 56.31, "elapsed_time": "10:39:53", "remaining_time": "8:16:31"}
|
| 367 |
+
{"current_steps": 367, "total_steps": 650, "loss": 0.3261, "lr": 1.898009623102415e-05, "epoch": 2.813786500718047, "percentage": 56.46, "elapsed_time": "10:41:32", "remaining_time": "8:14:42"}
|
| 368 |
+
{"current_steps": 368, "total_steps": 650, "loss": 0.4029, "lr": 1.887284632088725e-05, "epoch": 2.8214456677836286, "percentage": 56.62, "elapsed_time": "10:43:27", "remaining_time": "8:13:05"}
|
| 369 |
+
{"current_steps": 369, "total_steps": 650, "loss": 0.3588, "lr": 1.8765628917242213e-05, "epoch": 2.8291048348492103, "percentage": 56.77, "elapsed_time": "10:45:10", "remaining_time": "8:11:18"}
|
| 370 |
+
{"current_steps": 370, "total_steps": 650, "loss": 0.3039, "lr": 1.8658447112179952e-05, "epoch": 2.8367640019147915, "percentage": 56.92, "elapsed_time": "10:47:00", "remaining_time": "8:09:37"}
|
| 371 |
+
{"current_steps": 371, "total_steps": 650, "loss": 0.3836, "lr": 1.8551303996764755e-05, "epoch": 2.8444231689803736, "percentage": 57.08, "elapsed_time": "10:49:02", "remaining_time": "8:08:05"}
|
| 372 |
+
{"current_steps": 372, "total_steps": 650, "loss": 0.3679, "lr": 1.8444202660945105e-05, "epoch": 2.852082336045955, "percentage": 57.23, "elapsed_time": "10:50:54", "remaining_time": "8:06:26"}
|
| 373 |
+
{"current_steps": 373, "total_steps": 650, "loss": 0.288, "lr": 1.8337146193464595e-05, "epoch": 2.8597415031115365, "percentage": 57.38, "elapsed_time": "10:52:18", "remaining_time": "8:04:25"}
|
| 374 |
+
{"current_steps": 374, "total_steps": 650, "loss": 0.3741, "lr": 1.8230137681772836e-05, "epoch": 2.867400670177118, "percentage": 57.54, "elapsed_time": "10:54:26", "remaining_time": "8:02:57"}
|
| 375 |
+
{"current_steps": 375, "total_steps": 650, "loss": 0.3425, "lr": 1.8123180211936417e-05, "epoch": 2.8750598372427, "percentage": 57.69, "elapsed_time": "10:56:13", "remaining_time": "8:01:13"}
|
| 376 |
+
{"current_steps": 376, "total_steps": 650, "loss": 0.3436, "lr": 1.801627686854992e-05, "epoch": 2.8827190043082815, "percentage": 57.85, "elapsed_time": "10:57:39", "remaining_time": "7:59:15"}
|
| 377 |
+
{"current_steps": 377, "total_steps": 650, "loss": 0.3142, "lr": 1.7909430734646936e-05, "epoch": 2.890378171373863, "percentage": 58.0, "elapsed_time": "10:59:29", "remaining_time": "7:57:34"}
|
| 378 |
+
{"current_steps": 378, "total_steps": 650, "loss": 0.327, "lr": 1.780264489161117e-05, "epoch": 2.898037338439445, "percentage": 58.15, "elapsed_time": "11:01:05", "remaining_time": "7:55:42"}
|
| 379 |
+
{"current_steps": 379, "total_steps": 650, "loss": 0.3469, "lr": 1.769592241908758e-05, "epoch": 2.905696505505026, "percentage": 58.31, "elapsed_time": "11:03:00", "remaining_time": "7:54:04"}
|
| 380 |
+
{"current_steps": 380, "total_steps": 650, "loss": 0.398, "lr": 1.758926639489354e-05, "epoch": 2.913355672570608, "percentage": 58.46, "elapsed_time": "11:04:57", "remaining_time": "7:52:28"}
|
| 381 |
+
{"current_steps": 381, "total_steps": 650, "loss": 0.3077, "lr": 1.748267989493011e-05, "epoch": 2.9210148396361895, "percentage": 58.62, "elapsed_time": "11:06:54", "remaining_time": "7:50:51"}
|
| 382 |
+
{"current_steps": 382, "total_steps": 650, "loss": 0.3791, "lr": 1.7376165993093278e-05, "epoch": 2.928674006701771, "percentage": 58.77, "elapsed_time": "11:08:34", "remaining_time": "7:49:03"}
|
| 383 |
+
{"current_steps": 383, "total_steps": 650, "loss": 0.3203, "lr": 1.7269727761185374e-05, "epoch": 2.936333173767353, "percentage": 58.92, "elapsed_time": "11:10:32", "remaining_time": "7:47:26"}
|
| 384 |
+
{"current_steps": 384, "total_steps": 650, "loss": 0.3247, "lr": 1.7163368268826433e-05, "epoch": 2.9439923408329345, "percentage": 59.08, "elapsed_time": "11:12:14", "remaining_time": "7:45:40"}
|
| 385 |
+
{"current_steps": 385, "total_steps": 650, "loss": 0.3714, "lr": 1.7057090583365678e-05, "epoch": 2.951651507898516, "percentage": 59.23, "elapsed_time": "11:14:05", "remaining_time": "7:43:59"}
|
| 386 |
+
{"current_steps": 386, "total_steps": 650, "loss": 0.2943, "lr": 1.6950897769793093e-05, "epoch": 2.9593106749640974, "percentage": 59.38, "elapsed_time": "11:15:46", "remaining_time": "7:42:11"}
|
| 387 |
+
{"current_steps": 387, "total_steps": 650, "loss": 0.3443, "lr": 1.6844792890650976e-05, "epoch": 2.9669698420296795, "percentage": 59.54, "elapsed_time": "11:17:19", "remaining_time": "7:40:17"}
|
| 388 |
+
{"current_steps": 388, "total_steps": 650, "loss": 0.3399, "lr": 1.673877900594566e-05, "epoch": 2.9746290090952607, "percentage": 59.69, "elapsed_time": "11:19:11", "remaining_time": "7:38:37"}
|
| 389 |
+
{"current_steps": 389, "total_steps": 650, "loss": 0.344, "lr": 1.6632859173059232e-05, "epoch": 2.9822881761608424, "percentage": 59.85, "elapsed_time": "11:20:55", "remaining_time": "7:36:52"}
|
| 390 |
+
{"current_steps": 390, "total_steps": 650, "loss": 0.3455, "lr": 1.6527036446661396e-05, "epoch": 2.989947343226424, "percentage": 60.0, "elapsed_time": "11:22:38", "remaining_time": "7:35:05"}
|
| 391 |
+
{"current_steps": 391, "total_steps": 650, "loss": 0.4699, "lr": 1.6421313878621344e-05, "epoch": 2.9976065102920058, "percentage": 60.15, "elapsed_time": "11:24:13", "remaining_time": "7:33:14"}
|
| 392 |
+
{"current_steps": 392, "total_steps": 650, "loss": 0.3313, "lr": 1.631569451791977e-05, "epoch": 3.006701771182384, "percentage": 60.31, "elapsed_time": "11:26:56", "remaining_time": "7:32:07"}
|