Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:665e7cd795a2e6acc9b9c978c4bd61aa0943374737e2ce4aa627d5aa63fbc8d2
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:01b737c1752008fa9ec44191dd01619a21f972a2b4c5f264c8ecc94cb3a31cf8
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e2d4ccc92b0a15c6609997da975423bea0a09f632fa43b15e4c134b9de58b869
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22ae210ab91b0a01b6c413cb5d6a5d022932a8d64508efdd57660037c1b68942
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -251,3 +251,85 @@
|
|
| 251 |
{"current_steps": 251, "total_steps": 1230, "loss": 0.5501, "lr": 3.869490061403091e-05, "epoch": 1.0167088607594936, "percentage": 20.41, "elapsed_time": "1:39:33", "remaining_time": "6:28:19"}
|
| 252 |
{"current_steps": 252, "total_steps": 1230, "loss": 0.5597, "lr": 3.867465791158124e-05, "epoch": 1.0207594936708861, "percentage": 20.49, "elapsed_time": "1:39:53", "remaining_time": "6:27:41"}
|
| 253 |
{"current_steps": 253, "total_steps": 1230, "loss": 0.5359, "lr": 3.865426480600407e-05, "epoch": 1.0248101265822784, "percentage": 20.57, "elapsed_time": "1:40:12", "remaining_time": "6:27:00"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 251 |
{"current_steps": 251, "total_steps": 1230, "loss": 0.5501, "lr": 3.869490061403091e-05, "epoch": 1.0167088607594936, "percentage": 20.41, "elapsed_time": "1:39:33", "remaining_time": "6:28:19"}
|
| 252 |
{"current_steps": 252, "total_steps": 1230, "loss": 0.5597, "lr": 3.867465791158124e-05, "epoch": 1.0207594936708861, "percentage": 20.49, "elapsed_time": "1:39:53", "remaining_time": "6:27:41"}
|
| 253 |
{"current_steps": 253, "total_steps": 1230, "loss": 0.5359, "lr": 3.865426480600407e-05, "epoch": 1.0248101265822784, "percentage": 20.57, "elapsed_time": "1:40:12", "remaining_time": "6:27:00"}
|
| 254 |
+
{"current_steps": 254, "total_steps": 1230, "loss": 0.5477, "lr": 3.863372146154264e-05, "epoch": 1.028860759493671, "percentage": 20.65, "elapsed_time": "1:40:35", "remaining_time": "6:26:33"}
|
| 255 |
+
{"current_steps": 255, "total_steps": 1230, "loss": 0.5569, "lr": 3.861302804365024e-05, "epoch": 1.0329113924050632, "percentage": 20.73, "elapsed_time": "1:41:02", "remaining_time": "6:26:19"}
|
| 256 |
+
{"current_steps": 256, "total_steps": 1230, "loss": 0.5782, "lr": 3.85921847189888e-05, "epoch": 1.0369620253164558, "percentage": 20.81, "elapsed_time": "1:41:26", "remaining_time": "6:25:58"}
|
| 257 |
+
{"current_steps": 257, "total_steps": 1230, "loss": 0.5787, "lr": 3.85711916554276e-05, "epoch": 1.041012658227848, "percentage": 20.89, "elapsed_time": "1:41:45", "remaining_time": "6:25:13"}
|
| 258 |
+
{"current_steps": 258, "total_steps": 1230, "loss": 0.5584, "lr": 3.85500490220419e-05, "epoch": 1.0450632911392406, "percentage": 20.98, "elapsed_time": "1:42:04", "remaining_time": "6:24:34"}
|
| 259 |
+
{"current_steps": 259, "total_steps": 1230, "loss": 0.5626, "lr": 3.852875698911154e-05, "epoch": 1.0491139240506329, "percentage": 21.06, "elapsed_time": "1:42:24", "remaining_time": "6:23:56"}
|
| 260 |
+
{"current_steps": 260, "total_steps": 1230, "loss": 0.5526, "lr": 3.850731572811963e-05, "epoch": 1.0531645569620254, "percentage": 21.14, "elapsed_time": "1:42:46", "remaining_time": "6:23:25"}
|
| 261 |
+
{"current_steps": 261, "total_steps": 1230, "loss": 0.5695, "lr": 3.848572541175116e-05, "epoch": 1.0572151898734177, "percentage": 21.22, "elapsed_time": "1:43:10", "remaining_time": "6:23:02"}
|
| 262 |
+
{"current_steps": 262, "total_steps": 1230, "loss": 0.5375, "lr": 3.846398621389154e-05, "epoch": 1.0612658227848102, "percentage": 21.3, "elapsed_time": "1:43:29", "remaining_time": "6:22:22"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 1230, "loss": 0.5549, "lr": 3.84420983096253e-05, "epoch": 1.0653164556962025, "percentage": 21.38, "elapsed_time": "1:43:57", "remaining_time": "6:22:13"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 1230, "loss": 0.5666, "lr": 3.8420061875234606e-05, "epoch": 1.069367088607595, "percentage": 21.46, "elapsed_time": "1:44:18", "remaining_time": "6:21:42"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 1230, "loss": 0.5332, "lr": 3.839787708819787e-05, "epoch": 1.0734177215189873, "percentage": 21.54, "elapsed_time": "1:44:44", "remaining_time": "6:21:25"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 1230, "loss": 0.5708, "lr": 3.8375544127188325e-05, "epoch": 1.0774683544303798, "percentage": 21.63, "elapsed_time": "1:45:07", "remaining_time": "6:20:57"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 1230, "loss": 0.5611, "lr": 3.8353063172072564e-05, "epoch": 1.081518987341772, "percentage": 21.71, "elapsed_time": "1:45:27", "remaining_time": "6:20:21"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 1230, "loss": 0.5642, "lr": 3.8330434403909105e-05, "epoch": 1.0855696202531646, "percentage": 21.79, "elapsed_time": "1:45:57", "remaining_time": "6:20:18"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 1230, "loss": 0.5762, "lr": 3.8307658004946934e-05, "epoch": 1.089620253164557, "percentage": 21.87, "elapsed_time": "1:46:17", "remaining_time": "6:19:43"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 1230, "loss": 0.5744, "lr": 3.8284734158624046e-05, "epoch": 1.0936708860759494, "percentage": 21.95, "elapsed_time": "1:46:40", "remaining_time": "6:19:17"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 1230, "loss": 0.554, "lr": 3.826166304956594e-05, "epoch": 1.0977215189873417, "percentage": 22.03, "elapsed_time": "1:47:05", "remaining_time": "6:18:56"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 1230, "loss": 0.5507, "lr": 3.8238444863584164e-05, "epoch": 1.1017721518987342, "percentage": 22.11, "elapsed_time": "1:47:31", "remaining_time": "6:18:41"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 1230, "loss": 0.5363, "lr": 3.821507978767479e-05, "epoch": 1.1058227848101265, "percentage": 22.2, "elapsed_time": "1:47:53", "remaining_time": "6:18:12"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 1230, "loss": 0.5678, "lr": 3.819156801001693e-05, "epoch": 1.109873417721519, "percentage": 22.28, "elapsed_time": "1:48:14", "remaining_time": "6:17:41"}
|
| 275 |
+
{"current_steps": 310, "total_steps": 1230, "loss": 0.5669, "lr": 3.7249124400767006e-05, "epoch": 1.2556962025316456, "percentage": 25.2, "elapsed_time": "2:02:00", "remaining_time": "6:02:05"}
|
| 276 |
+
{"current_steps": 311, "total_steps": 1230, "loss": 0.5533, "lr": 3.722032761533114e-05, "epoch": 1.259746835443038, "percentage": 25.28, "elapsed_time": "2:02:21", "remaining_time": "6:01:34"}
|
| 277 |
+
{"current_steps": 312, "total_steps": 1230, "loss": 0.5615, "lr": 3.719139213974403e-05, "epoch": 1.2637974683544304, "percentage": 25.37, "elapsed_time": "2:02:43", "remaining_time": "6:01:04"}
|
| 278 |
+
{"current_steps": 313, "total_steps": 1230, "loss": 0.5358, "lr": 3.7162318207048006e-05, "epoch": 1.2678481012658227, "percentage": 25.45, "elapsed_time": "2:03:06", "remaining_time": "6:00:39"}
|
| 279 |
+
{"current_steps": 314, "total_steps": 1230, "loss": 0.593, "lr": 3.713310605140055e-05, "epoch": 1.2718987341772152, "percentage": 25.53, "elapsed_time": "2:03:27", "remaining_time": "6:00:10"}
|
| 280 |
+
{"current_steps": 315, "total_steps": 1230, "loss": 0.5701, "lr": 3.710375590807233e-05, "epoch": 1.2759493670886077, "percentage": 25.61, "elapsed_time": "2:03:55", "remaining_time": "5:59:59"}
|
| 281 |
+
{"current_steps": 316, "total_steps": 1230, "loss": 0.5896, "lr": 3.7074268013445365e-05, "epoch": 1.28, "percentage": 25.69, "elapsed_time": "2:04:13", "remaining_time": "5:59:17"}
|
| 282 |
+
{"current_steps": 317, "total_steps": 1230, "loss": 0.5549, "lr": 3.7044642605011114e-05, "epoch": 1.2840506329113923, "percentage": 25.77, "elapsed_time": "2:04:37", "remaining_time": "5:58:55"}
|
| 283 |
+
{"current_steps": 318, "total_steps": 1230, "loss": 0.567, "lr": 3.701487992136854e-05, "epoch": 1.2881012658227848, "percentage": 25.85, "elapsed_time": "2:05:01", "remaining_time": "5:58:32"}
|
| 284 |
+
{"current_steps": 319, "total_steps": 1230, "loss": 0.5862, "lr": 3.69849802022222e-05, "epoch": 1.2921518987341774, "percentage": 25.93, "elapsed_time": "2:05:28", "remaining_time": "5:58:19"}
|
| 285 |
+
{"current_steps": 320, "total_steps": 1230, "loss": 0.5813, "lr": 3.6954943688380334e-05, "epoch": 1.2962025316455696, "percentage": 26.02, "elapsed_time": "2:05:47", "remaining_time": "5:57:43"}
|
| 286 |
+
{"current_steps": 321, "total_steps": 1230, "loss": 0.5514, "lr": 3.692477062175289e-05, "epoch": 1.300253164556962, "percentage": 26.1, "elapsed_time": "2:06:11", "remaining_time": "5:57:21"}
|
| 287 |
+
{"current_steps": 322, "total_steps": 1230, "loss": 0.5592, "lr": 3.689446124534958e-05, "epoch": 1.3043037974683545, "percentage": 26.18, "elapsed_time": "2:06:37", "remaining_time": "5:57:03"}
|
| 288 |
+
{"current_steps": 323, "total_steps": 1230, "loss": 0.5752, "lr": 3.686401580327799e-05, "epoch": 1.308354430379747, "percentage": 26.26, "elapsed_time": "2:06:55", "remaining_time": "5:56:25"}
|
| 289 |
+
{"current_steps": 324, "total_steps": 1230, "loss": 0.5804, "lr": 3.683343454074149e-05, "epoch": 1.3124050632911393, "percentage": 26.34, "elapsed_time": "2:07:17", "remaining_time": "5:55:56"}
|
| 290 |
+
{"current_steps": 325, "total_steps": 1230, "loss": 0.5479, "lr": 3.6802717704037386e-05, "epoch": 1.3164556962025316, "percentage": 26.42, "elapsed_time": "2:07:43", "remaining_time": "5:55:39"}
|
| 291 |
+
{"current_steps": 326, "total_steps": 1230, "loss": 0.5588, "lr": 3.6771865540554855e-05, "epoch": 1.320506329113924, "percentage": 26.5, "elapsed_time": "2:08:10", "remaining_time": "5:55:26"}
|
| 292 |
+
{"current_steps": 327, "total_steps": 1230, "loss": 0.5391, "lr": 3.674087829877297e-05, "epoch": 1.3245569620253166, "percentage": 26.59, "elapsed_time": "2:08:33", "remaining_time": "5:54:59"}
|
| 293 |
+
{"current_steps": 328, "total_steps": 1230, "loss": 0.5729, "lr": 3.6709756228258735e-05, "epoch": 1.3286075949367089, "percentage": 26.67, "elapsed_time": "2:08:54", "remaining_time": "5:54:30"}
|
| 294 |
+
{"current_steps": 329, "total_steps": 1230, "loss": 0.5677, "lr": 3.667849957966501e-05, "epoch": 1.3326582278481012, "percentage": 26.75, "elapsed_time": "2:09:15", "remaining_time": "5:53:58"}
|
| 295 |
+
{"current_steps": 330, "total_steps": 1230, "loss": 0.5784, "lr": 3.6647108604728546e-05, "epoch": 1.3367088607594937, "percentage": 26.83, "elapsed_time": "2:09:46", "remaining_time": "5:53:55"}
|
| 296 |
+
{"current_steps": 461, "total_steps": 1230, "loss": 0.5499, "lr": 3.148314933498886e-05, "epoch": 1.8673417721518988, "percentage": 37.48, "elapsed_time": "3:01:03", "remaining_time": "5:02:01"}
|
| 297 |
+
{"current_steps": 462, "total_steps": 1230, "loss": 0.5553, "lr": 3.143663228021431e-05, "epoch": 1.871392405063291, "percentage": 37.56, "elapsed_time": "3:01:28", "remaining_time": "5:01:40"}
|
| 298 |
+
{"current_steps": 463, "total_steps": 1230, "loss": 0.5592, "lr": 3.1390023116375624e-05, "epoch": 1.8754430379746836, "percentage": 37.64, "elapsed_time": "3:01:51", "remaining_time": "5:01:15"}
|
| 299 |
+
{"current_steps": 464, "total_steps": 1230, "loss": 0.5724, "lr": 3.134332221885661e-05, "epoch": 1.879493670886076, "percentage": 37.72, "elapsed_time": "3:02:13", "remaining_time": "5:00:49"}
|
| 300 |
+
{"current_steps": 465, "total_steps": 1230, "loss": 0.5637, "lr": 3.129652996377987e-05, "epoch": 1.8835443037974684, "percentage": 37.8, "elapsed_time": "3:02:35", "remaining_time": "5:00:24"}
|
| 301 |
+
{"current_steps": 466, "total_steps": 1230, "loss": 0.5746, "lr": 3.12496467280038e-05, "epoch": 1.8875949367088607, "percentage": 37.89, "elapsed_time": "3:02:57", "remaining_time": "4:59:57"}
|
| 302 |
+
{"current_steps": 467, "total_steps": 1230, "loss": 0.5701, "lr": 3.120267288911952e-05, "epoch": 1.8916455696202532, "percentage": 37.97, "elapsed_time": "3:03:17", "remaining_time": "4:59:28"}
|
| 303 |
+
{"current_steps": 468, "total_steps": 1230, "loss": 0.5667, "lr": 3.11556088254479e-05, "epoch": 1.8956962025316457, "percentage": 38.05, "elapsed_time": "3:03:43", "remaining_time": "4:59:08"}
|
| 304 |
+
{"current_steps": 469, "total_steps": 1230, "loss": 0.5401, "lr": 3.11084549160364e-05, "epoch": 1.899746835443038, "percentage": 38.13, "elapsed_time": "3:04:11", "remaining_time": "4:58:52"}
|
| 305 |
+
{"current_steps": 470, "total_steps": 1230, "loss": 0.5693, "lr": 3.106121154065615e-05, "epoch": 1.9037974683544303, "percentage": 38.21, "elapsed_time": "3:04:31", "remaining_time": "4:58:23"}
|
| 306 |
+
{"current_steps": 471, "total_steps": 1230, "loss": 0.5489, "lr": 3.1013879079798805e-05, "epoch": 1.9078481012658228, "percentage": 38.29, "elapsed_time": "3:04:55", "remaining_time": "4:57:59"}
|
| 307 |
+
{"current_steps": 472, "total_steps": 1230, "loss": 0.5933, "lr": 3.096645791467348e-05, "epoch": 1.9118987341772153, "percentage": 38.37, "elapsed_time": "3:05:12", "remaining_time": "4:57:26"}
|
| 308 |
+
{"current_steps": 473, "total_steps": 1230, "loss": 0.5819, "lr": 3.091894842720373e-05, "epoch": 1.9159493670886076, "percentage": 38.46, "elapsed_time": "3:05:38", "remaining_time": "4:57:05"}
|
| 309 |
+
{"current_steps": 474, "total_steps": 1230, "loss": 0.5792, "lr": 3.0871351000024425e-05, "epoch": 1.92, "percentage": 38.54, "elapsed_time": "3:06:02", "remaining_time": "4:56:43"}
|
| 310 |
+
{"current_steps": 475, "total_steps": 1230, "loss": 0.5896, "lr": 3.0823666016478716e-05, "epoch": 1.9240506329113924, "percentage": 38.62, "elapsed_time": "3:06:24", "remaining_time": "4:56:16"}
|
| 311 |
+
{"current_steps": 476, "total_steps": 1230, "loss": 0.576, "lr": 3.0775893860614896e-05, "epoch": 1.928101265822785, "percentage": 38.7, "elapsed_time": "3:06:50", "remaining_time": "4:55:58"}
|
| 312 |
+
{"current_steps": 477, "total_steps": 1230, "loss": 0.566, "lr": 3.0728034917183336e-05, "epoch": 1.9321518987341773, "percentage": 38.78, "elapsed_time": "3:07:14", "remaining_time": "4:55:34"}
|
| 313 |
+
{"current_steps": 478, "total_steps": 1230, "loss": 0.553, "lr": 3.06800895716334e-05, "epoch": 1.9362025316455695, "percentage": 38.86, "elapsed_time": "3:07:36", "remaining_time": "4:55:09"}
|
| 314 |
+
{"current_steps": 479, "total_steps": 1230, "loss": 0.5559, "lr": 3.063205821011029e-05, "epoch": 1.940253164556962, "percentage": 38.94, "elapsed_time": "3:08:03", "remaining_time": "4:54:51"}
|
| 315 |
+
{"current_steps": 480, "total_steps": 1230, "loss": 0.5519, "lr": 3.0583941219452016e-05, "epoch": 1.9443037974683546, "percentage": 39.02, "elapsed_time": "3:08:32", "remaining_time": "4:54:36"}
|
| 316 |
+
{"current_steps": 481, "total_steps": 1230, "loss": 0.5726, "lr": 3.053573898718618e-05, "epoch": 1.9483544303797469, "percentage": 39.11, "elapsed_time": "3:08:53", "remaining_time": "4:54:08"}
|
| 317 |
+
{"current_steps": 482, "total_steps": 1230, "loss": 0.58, "lr": 3.0487451901526956e-05, "epoch": 1.9524050632911392, "percentage": 39.19, "elapsed_time": "3:09:18", "remaining_time": "4:53:47"}
|
| 318 |
+
{"current_steps": 483, "total_steps": 1230, "loss": 0.5724, "lr": 3.0439080351371875e-05, "epoch": 1.9564556962025317, "percentage": 39.27, "elapsed_time": "3:09:46", "remaining_time": "4:53:29"}
|
| 319 |
+
{"current_steps": 484, "total_steps": 1230, "loss": 0.5824, "lr": 3.0390624726298764e-05, "epoch": 1.9605063291139242, "percentage": 39.35, "elapsed_time": "3:10:06", "remaining_time": "4:53:01"}
|
| 320 |
+
{"current_steps": 485, "total_steps": 1230, "loss": 0.5561, "lr": 3.034208541656255e-05, "epoch": 1.9645569620253165, "percentage": 39.43, "elapsed_time": "3:10:32", "remaining_time": "4:52:40"}
|
| 321 |
+
{"current_steps": 486, "total_steps": 1230, "loss": 0.5714, "lr": 3.029346281309218e-05, "epoch": 1.9686075949367088, "percentage": 39.51, "elapsed_time": "3:10:51", "remaining_time": "4:52:11"}
|
| 322 |
+
{"current_steps": 487, "total_steps": 1230, "loss": 0.558, "lr": 3.0244757307487415e-05, "epoch": 1.9726582278481013, "percentage": 39.59, "elapsed_time": "3:11:13", "remaining_time": "4:51:44"}
|
| 323 |
+
{"current_steps": 488, "total_steps": 1230, "loss": 0.5634, "lr": 3.019596929201569e-05, "epoch": 1.9767088607594938, "percentage": 39.67, "elapsed_time": "3:11:33", "remaining_time": "4:51:16"}
|
| 324 |
+
{"current_steps": 489, "total_steps": 1230, "loss": 0.5814, "lr": 3.0147099159608985e-05, "epoch": 1.980759493670886, "percentage": 39.76, "elapsed_time": "3:12:00", "remaining_time": "4:50:57"}
|
| 325 |
+
{"current_steps": 490, "total_steps": 1230, "loss": 0.5598, "lr": 3.0098147303860616e-05, "epoch": 1.9848101265822784, "percentage": 39.84, "elapsed_time": "3:12:21", "remaining_time": "4:50:30"}
|
| 326 |
+
{"current_steps": 491, "total_steps": 1230, "loss": 0.5646, "lr": 3.0049114119022117e-05, "epoch": 1.988860759493671, "percentage": 39.92, "elapsed_time": "3:12:46", "remaining_time": "4:50:09"}
|
| 327 |
+
{"current_steps": 492, "total_steps": 1230, "loss": 0.5839, "lr": 3.0000000000000004e-05, "epoch": 1.9929113924050634, "percentage": 40.0, "elapsed_time": "3:13:15", "remaining_time": "4:49:53"}
|
| 328 |
+
{"current_steps": 493, "total_steps": 1230, "loss": 0.5588, "lr": 2.995080534235264e-05, "epoch": 1.9969620253164557, "percentage": 40.08, "elapsed_time": "3:13:39", "remaining_time": "4:49:30"}
|
| 329 |
+
{"current_steps": 494, "total_steps": 1230, "loss": 0.5354, "lr": 2.9901530542287044e-05, "epoch": 2.001012658227848, "percentage": 40.16, "elapsed_time": "3:15:26", "remaining_time": "4:51:11"}
|
| 330 |
+
{"current_steps": 495, "total_steps": 1230, "loss": 0.3599, "lr": 2.9852175996655676e-05, "epoch": 2.0050632911392405, "percentage": 40.24, "elapsed_time": "3:15:48", "remaining_time": "4:50:45"}
|
| 331 |
+
{"current_steps": 496, "total_steps": 1230, "loss": 0.3608, "lr": 2.980274210295326e-05, "epoch": 2.009113924050633, "percentage": 40.33, "elapsed_time": "3:16:09", "remaining_time": "4:50:16"}
|
| 332 |
+
{"current_steps": 497, "total_steps": 1230, "loss": 0.3586, "lr": 2.9753229259313578e-05, "epoch": 2.013164556962025, "percentage": 40.41, "elapsed_time": "3:16:29", "remaining_time": "4:49:47"}
|
| 333 |
+
{"current_steps": 498, "total_steps": 1230, "loss": 0.354, "lr": 2.9703637864506274e-05, "epoch": 2.0172151898734176, "percentage": 40.49, "elapsed_time": "3:16:54", "remaining_time": "4:49:26"}
|
| 334 |
+
{"current_steps": 499, "total_steps": 1230, "loss": 0.3672, "lr": 2.965396831793362e-05, "epoch": 2.02126582278481, "percentage": 40.57, "elapsed_time": "3:17:14", "remaining_time": "4:48:56"}
|
| 335 |
+
{"current_steps": 500, "total_steps": 1230, "loss": 0.3814, "lr": 2.9604221019627316e-05, "epoch": 2.0253164556962027, "percentage": 40.65, "elapsed_time": "3:17:41", "remaining_time": "4:48:37"}
|