Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5594cbe80851ba820cc3fc8b32ffad74f9219873ecdac8b2064bf16f09ed9cd1
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:31f641aedb127b9fbc0b4f446eaa88759d5b538f5289380601ad94e9e40df981
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:73895e5b951a5183ba05f244ec8c9f57912ac60c65c0b3f555e007ae13223a9f
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1c85c384b16da4d25f8b73c79781438b95cd2a6474592e9ceaac05bf5c2b521
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -542,3 +542,246 @@
|
|
| 542 |
{"current_steps": 299, "total_steps": 1215, "loss": 0.3985, "lr": 3.746709743578462e-05, "epoch": 1.2291880781089415, "percentage": 24.61, "elapsed_time": "1:56:27", "remaining_time": "5:56:46"}
|
| 543 |
{"current_steps": 300, "total_steps": 1215, "loss": 0.384, "lr": 3.7439024938728435e-05, "epoch": 1.2332990750256938, "percentage": 24.69, "elapsed_time": "1:56:49", "remaining_time": "5:56:20"}
|
| 544 |
{"current_steps": 301, "total_steps": 1215, "loss": 0.3908, "lr": 3.74108083690963e-05, "epoch": 1.2374100719424461, "percentage": 24.77, "elapsed_time": "1:57:12", "remaining_time": "5:55:54"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 542 |
{"current_steps": 299, "total_steps": 1215, "loss": 0.3985, "lr": 3.746709743578462e-05, "epoch": 1.2291880781089415, "percentage": 24.61, "elapsed_time": "1:56:27", "remaining_time": "5:56:46"}
|
| 543 |
{"current_steps": 300, "total_steps": 1215, "loss": 0.384, "lr": 3.7439024938728435e-05, "epoch": 1.2332990750256938, "percentage": 24.69, "elapsed_time": "1:56:49", "remaining_time": "5:56:20"}
|
| 544 |
{"current_steps": 301, "total_steps": 1215, "loss": 0.3908, "lr": 3.74108083690963e-05, "epoch": 1.2374100719424461, "percentage": 24.77, "elapsed_time": "1:57:12", "remaining_time": "5:55:54"}
|
| 545 |
+
{"current_steps": 302, "total_steps": 1215, "loss": 0.3869, "lr": 3.7382447959999514e-05, "epoch": 1.2415210688591984, "percentage": 24.86, "elapsed_time": "1:57:35", "remaining_time": "5:55:28"}
|
| 546 |
+
{"current_steps": 303, "total_steps": 1215, "loss": 0.3984, "lr": 3.7353943945737716e-05, "epoch": 1.2456320657759508, "percentage": 24.94, "elapsed_time": "1:57:57", "remaining_time": "5:55:01"}
|
| 547 |
+
{"current_steps": 304, "total_steps": 1215, "loss": 0.3908, "lr": 3.7325296561796936e-05, "epoch": 1.249743062692703, "percentage": 25.02, "elapsed_time": "1:58:20", "remaining_time": "5:54:36"}
|
| 548 |
+
{"current_steps": 305, "total_steps": 1215, "loss": 0.3789, "lr": 3.729650604484766e-05, "epoch": 1.2538540596094552, "percentage": 25.1, "elapsed_time": "1:58:43", "remaining_time": "5:54:13"}
|
| 549 |
+
{"current_steps": 306, "total_steps": 1215, "loss": 0.39, "lr": 3.7267572632742846e-05, "epoch": 1.2579650565262077, "percentage": 25.19, "elapsed_time": "1:59:05", "remaining_time": "5:53:46"}
|
| 550 |
+
{"current_steps": 307, "total_steps": 1215, "loss": 0.398, "lr": 3.7238496564516006e-05, "epoch": 1.2620760534429598, "percentage": 25.27, "elapsed_time": "1:59:29", "remaining_time": "5:53:24"}
|
| 551 |
+
{"current_steps": 308, "total_steps": 1215, "loss": 0.385, "lr": 3.720927808037921e-05, "epoch": 1.2661870503597124, "percentage": 25.35, "elapsed_time": "1:59:52", "remaining_time": "5:52:59"}
|
| 552 |
+
{"current_steps": 309, "total_steps": 1215, "loss": 0.3801, "lr": 3.717991742172106e-05, "epoch": 1.2702980472764644, "percentage": 25.43, "elapsed_time": "2:00:15", "remaining_time": "5:52:35"}
|
| 553 |
+
{"current_steps": 310, "total_steps": 1215, "loss": 0.3936, "lr": 3.7150414831104765e-05, "epoch": 1.274409044193217, "percentage": 25.51, "elapsed_time": "2:00:37", "remaining_time": "5:52:08"}
|
| 554 |
+
{"current_steps": 311, "total_steps": 1215, "loss": 0.3966, "lr": 3.712077055226611e-05, "epoch": 1.278520041109969, "percentage": 25.6, "elapsed_time": "2:00:59", "remaining_time": "5:51:42"}
|
| 555 |
+
{"current_steps": 312, "total_steps": 1215, "loss": 0.3863, "lr": 3.7090984830111415e-05, "epoch": 1.2826310380267214, "percentage": 25.68, "elapsed_time": "2:01:22", "remaining_time": "5:51:18"}
|
| 556 |
+
{"current_steps": 313, "total_steps": 1215, "loss": 0.4019, "lr": 3.7061057910715546e-05, "epoch": 1.2867420349434737, "percentage": 25.76, "elapsed_time": "2:01:45", "remaining_time": "5:50:52"}
|
| 557 |
+
{"current_steps": 314, "total_steps": 1215, "loss": 0.389, "lr": 3.703099004131988e-05, "epoch": 1.290853031860226, "percentage": 25.84, "elapsed_time": "2:02:08", "remaining_time": "5:50:28"}
|
| 558 |
+
{"current_steps": 315, "total_steps": 1215, "loss": 0.3826, "lr": 3.700078147033023e-05, "epoch": 1.2949640287769784, "percentage": 25.93, "elapsed_time": "2:02:31", "remaining_time": "5:50:03"}
|
| 559 |
+
{"current_steps": 316, "total_steps": 1215, "loss": 0.387, "lr": 3.697043244731484e-05, "epoch": 1.2990750256937307, "percentage": 26.01, "elapsed_time": "2:02:54", "remaining_time": "5:49:38"}
|
| 560 |
+
{"current_steps": 317, "total_steps": 1215, "loss": 0.3903, "lr": 3.693994322300228e-05, "epoch": 1.303186022610483, "percentage": 26.09, "elapsed_time": "2:03:16", "remaining_time": "5:49:13"}
|
| 561 |
+
{"current_steps": 318, "total_steps": 1215, "loss": 0.3907, "lr": 3.69093140492794e-05, "epoch": 1.3072970195272353, "percentage": 26.17, "elapsed_time": "2:03:38", "remaining_time": "5:48:46"}
|
| 562 |
+
{"current_steps": 319, "total_steps": 1215, "loss": 0.3884, "lr": 3.687854517918926e-05, "epoch": 1.3114080164439876, "percentage": 26.26, "elapsed_time": "2:04:02", "remaining_time": "5:48:23"}
|
| 563 |
+
{"current_steps": 320, "total_steps": 1215, "loss": 0.3897, "lr": 3.684763686692898e-05, "epoch": 1.31551901336074, "percentage": 26.34, "elapsed_time": "2:04:24", "remaining_time": "5:47:57"}
|
| 564 |
+
{"current_steps": 321, "total_steps": 1215, "loss": 0.3819, "lr": 3.681658936784773e-05, "epoch": 1.3196300102774923, "percentage": 26.42, "elapsed_time": "2:04:48", "remaining_time": "5:47:34"}
|
| 565 |
+
{"current_steps": 322, "total_steps": 1215, "loss": 0.4029, "lr": 3.678540293844455e-05, "epoch": 1.3237410071942446, "percentage": 26.5, "elapsed_time": "2:05:10", "remaining_time": "5:47:07"}
|
| 566 |
+
{"current_steps": 323, "total_steps": 1215, "loss": 0.3888, "lr": 3.675407783636624e-05, "epoch": 1.327852004110997, "percentage": 26.58, "elapsed_time": "2:05:32", "remaining_time": "5:46:42"}
|
| 567 |
+
{"current_steps": 324, "total_steps": 1215, "loss": 0.388, "lr": 3.672261432040527e-05, "epoch": 1.3319630010277492, "percentage": 26.67, "elapsed_time": "2:05:56", "remaining_time": "5:46:21"}
|
| 568 |
+
{"current_steps": 325, "total_steps": 1215, "loss": 0.3949, "lr": 3.6691012650497605e-05, "epoch": 1.3360739979445015, "percentage": 26.75, "elapsed_time": "2:06:17", "remaining_time": "5:45:51"}
|
| 569 |
+
{"current_steps": 326, "total_steps": 1215, "loss": 0.3801, "lr": 3.665927308772057e-05, "epoch": 1.3401849948612539, "percentage": 26.83, "elapsed_time": "2:06:41", "remaining_time": "5:45:28"}
|
| 570 |
+
{"current_steps": 327, "total_steps": 1215, "loss": 0.4011, "lr": 3.6627395894290685e-05, "epoch": 1.3442959917780062, "percentage": 26.91, "elapsed_time": "2:07:03", "remaining_time": "5:45:02"}
|
| 571 |
+
{"current_steps": 328, "total_steps": 1215, "loss": 0.3841, "lr": 3.659538133356153e-05, "epoch": 1.3484069886947585, "percentage": 27.0, "elapsed_time": "2:07:26", "remaining_time": "5:44:39"}
|
| 572 |
+
{"current_steps": 329, "total_steps": 1215, "loss": 0.3798, "lr": 3.656322967002151e-05, "epoch": 1.3525179856115108, "percentage": 27.08, "elapsed_time": "2:07:49", "remaining_time": "5:44:14"}
|
| 573 |
+
{"current_steps": 330, "total_steps": 1215, "loss": 0.3769, "lr": 3.6530941169291744e-05, "epoch": 1.3566289825282631, "percentage": 27.16, "elapsed_time": "2:08:13", "remaining_time": "5:43:51"}
|
| 574 |
+
{"current_steps": 331, "total_steps": 1215, "loss": 0.4005, "lr": 3.649851609812379e-05, "epoch": 1.3607399794450155, "percentage": 27.24, "elapsed_time": "2:08:36", "remaining_time": "5:43:27"}
|
| 575 |
+
{"current_steps": 332, "total_steps": 1215, "loss": 0.3812, "lr": 3.646595472439753e-05, "epoch": 1.3648509763617678, "percentage": 27.33, "elapsed_time": "2:08:58", "remaining_time": "5:43:02"}
|
| 576 |
+
{"current_steps": 333, "total_steps": 1215, "loss": 0.3949, "lr": 3.643325731711888e-05, "epoch": 1.36896197327852, "percentage": 27.41, "elapsed_time": "2:09:22", "remaining_time": "5:42:39"}
|
| 577 |
+
{"current_steps": 334, "total_steps": 1215, "loss": 0.3951, "lr": 3.6400424146417604e-05, "epoch": 1.3730729701952724, "percentage": 27.49, "elapsed_time": "2:09:46", "remaining_time": "5:42:18"}
|
| 578 |
+
{"current_steps": 335, "total_steps": 1215, "loss": 0.3886, "lr": 3.6367455483545066e-05, "epoch": 1.3771839671120247, "percentage": 27.57, "elapsed_time": "2:10:09", "remaining_time": "5:41:54"}
|
| 579 |
+
{"current_steps": 336, "total_steps": 1215, "loss": 0.3833, "lr": 3.633435160087202e-05, "epoch": 1.381294964028777, "percentage": 27.65, "elapsed_time": "2:10:33", "remaining_time": "5:41:32"}
|
| 580 |
+
{"current_steps": 337, "total_steps": 1215, "loss": 0.3947, "lr": 3.6301112771886315e-05, "epoch": 1.3854059609455294, "percentage": 27.74, "elapsed_time": "2:10:56", "remaining_time": "5:41:08"}
|
| 581 |
+
{"current_steps": 338, "total_steps": 1215, "loss": 0.39, "lr": 3.62677392711907e-05, "epoch": 1.3895169578622815, "percentage": 27.82, "elapsed_time": "2:11:17", "remaining_time": "5:40:40"}
|
| 582 |
+
{"current_steps": 339, "total_steps": 1215, "loss": 0.3912, "lr": 3.623423137450046e-05, "epoch": 1.393627954779034, "percentage": 27.9, "elapsed_time": "2:11:40", "remaining_time": "5:40:15"}
|
| 583 |
+
{"current_steps": 340, "total_steps": 1215, "loss": 0.3902, "lr": 3.620058935864123e-05, "epoch": 1.397738951695786, "percentage": 27.98, "elapsed_time": "2:12:03", "remaining_time": "5:39:50"}
|
| 584 |
+
{"current_steps": 341, "total_steps": 1215, "loss": 0.3817, "lr": 3.616681350154666e-05, "epoch": 1.4018499486125386, "percentage": 28.07, "elapsed_time": "2:12:26", "remaining_time": "5:39:26"}
|
| 585 |
+
{"current_steps": 342, "total_steps": 1215, "loss": 0.3827, "lr": 3.613290408225615e-05, "epoch": 1.4059609455292907, "percentage": 28.15, "elapsed_time": "2:12:49", "remaining_time": "5:39:02"}
|
| 586 |
+
{"current_steps": 343, "total_steps": 1215, "loss": 0.3874, "lr": 3.609886138091247e-05, "epoch": 1.4100719424460433, "percentage": 28.23, "elapsed_time": "2:13:11", "remaining_time": "5:38:37"}
|
| 587 |
+
{"current_steps": 344, "total_steps": 1215, "loss": 0.3863, "lr": 3.606468567875957e-05, "epoch": 1.4141829393627954, "percentage": 28.31, "elapsed_time": "2:13:34", "remaining_time": "5:38:11"}
|
| 588 |
+
{"current_steps": 345, "total_steps": 1215, "loss": 0.3878, "lr": 3.603037725814014e-05, "epoch": 1.418293936279548, "percentage": 28.4, "elapsed_time": "2:13:57", "remaining_time": "5:37:48"}
|
| 589 |
+
{"current_steps": 346, "total_steps": 1215, "loss": 0.3775, "lr": 3.599593640249334e-05, "epoch": 1.4224049331963, "percentage": 28.48, "elapsed_time": "2:14:19", "remaining_time": "5:37:23"}
|
| 590 |
+
{"current_steps": 347, "total_steps": 1215, "loss": 0.3878, "lr": 3.5961363396352435e-05, "epoch": 1.4265159301130523, "percentage": 28.56, "elapsed_time": "2:14:43", "remaining_time": "5:36:59"}
|
| 591 |
+
{"current_steps": 348, "total_steps": 1215, "loss": 0.3882, "lr": 3.592665852534246e-05, "epoch": 1.4306269270298047, "percentage": 28.64, "elapsed_time": "2:15:06", "remaining_time": "5:36:35"}
|
| 592 |
+
{"current_steps": 349, "total_steps": 1215, "loss": 0.3848, "lr": 3.589182207617785e-05, "epoch": 1.434737923946557, "percentage": 28.72, "elapsed_time": "2:15:27", "remaining_time": "5:36:08"}
|
| 593 |
+
{"current_steps": 350, "total_steps": 1215, "loss": 0.3737, "lr": 3.5856854336660075e-05, "epoch": 1.4388489208633093, "percentage": 28.81, "elapsed_time": "2:15:51", "remaining_time": "5:35:46"}
|
| 594 |
+
{"current_steps": 351, "total_steps": 1215, "loss": 0.394, "lr": 3.582175559567524e-05, "epoch": 1.4429599177800616, "percentage": 28.89, "elapsed_time": "2:16:14", "remaining_time": "5:35:21"}
|
| 595 |
+
{"current_steps": 352, "total_steps": 1215, "loss": 0.3924, "lr": 3.578652614319177e-05, "epoch": 1.447070914696814, "percentage": 28.97, "elapsed_time": "2:16:36", "remaining_time": "5:34:55"}
|
| 596 |
+
{"current_steps": 353, "total_steps": 1215, "loss": 0.3895, "lr": 3.575116627025791e-05, "epoch": 1.4511819116135662, "percentage": 29.05, "elapsed_time": "2:17:00", "remaining_time": "5:34:32"}
|
| 597 |
+
{"current_steps": 354, "total_steps": 1215, "loss": 0.3979, "lr": 3.571567626899939e-05, "epoch": 1.4552929085303186, "percentage": 29.14, "elapsed_time": "2:17:24", "remaining_time": "5:34:11"}
|
| 598 |
+
{"current_steps": 355, "total_steps": 1215, "loss": 0.3865, "lr": 3.568005643261701e-05, "epoch": 1.4594039054470709, "percentage": 29.22, "elapsed_time": "2:17:47", "remaining_time": "5:33:48"}
|
| 599 |
+
{"current_steps": 356, "total_steps": 1215, "loss": 0.3927, "lr": 3.5644307055384204e-05, "epoch": 1.4635149023638232, "percentage": 29.3, "elapsed_time": "2:18:09", "remaining_time": "5:33:22"}
|
| 600 |
+
{"current_steps": 357, "total_steps": 1215, "loss": 0.3906, "lr": 3.5608428432644574e-05, "epoch": 1.4676258992805755, "percentage": 29.38, "elapsed_time": "2:18:32", "remaining_time": "5:32:59"}
|
| 601 |
+
{"current_steps": 358, "total_steps": 1215, "loss": 0.3882, "lr": 3.557242086080953e-05, "epoch": 1.4717368961973278, "percentage": 29.47, "elapsed_time": "2:18:56", "remaining_time": "5:32:36"}
|
| 602 |
+
{"current_steps": 359, "total_steps": 1215, "loss": 0.3882, "lr": 3.5536284637355766e-05, "epoch": 1.4758478931140802, "percentage": 29.55, "elapsed_time": "2:19:20", "remaining_time": "5:32:14"}
|
| 603 |
+
{"current_steps": 360, "total_steps": 1215, "loss": 0.39, "lr": 3.5500020060822844e-05, "epoch": 1.4799588900308325, "percentage": 29.63, "elapsed_time": "2:19:42", "remaining_time": "5:31:49"}
|
| 604 |
+
{"current_steps": 361, "total_steps": 1215, "loss": 0.3919, "lr": 3.54636274308107e-05, "epoch": 1.4840698869475848, "percentage": 29.71, "elapsed_time": "2:20:05", "remaining_time": "5:31:23"}
|
| 605 |
+
{"current_steps": 362, "total_steps": 1215, "loss": 0.3841, "lr": 3.542710704797721e-05, "epoch": 1.4881808838643371, "percentage": 29.79, "elapsed_time": "2:20:27", "remaining_time": "5:30:57"}
|
| 606 |
+
{"current_steps": 363, "total_steps": 1215, "loss": 0.375, "lr": 3.539045921403566e-05, "epoch": 1.4922918807810894, "percentage": 29.88, "elapsed_time": "2:20:49", "remaining_time": "5:30:32"}
|
| 607 |
+
{"current_steps": 364, "total_steps": 1215, "loss": 0.3884, "lr": 3.5353684231752276e-05, "epoch": 1.4964028776978417, "percentage": 29.96, "elapsed_time": "2:21:11", "remaining_time": "5:30:06"}
|
| 608 |
+
{"current_steps": 365, "total_steps": 1215, "loss": 0.3953, "lr": 3.531678240494373e-05, "epoch": 1.500513874614594, "percentage": 30.04, "elapsed_time": "2:21:34", "remaining_time": "5:29:40"}
|
| 609 |
+
{"current_steps": 366, "total_steps": 1215, "loss": 0.3864, "lr": 3.5279754038474616e-05, "epoch": 1.5046248715313464, "percentage": 30.12, "elapsed_time": "2:21:57", "remaining_time": "5:29:18"}
|
| 610 |
+
{"current_steps": 367, "total_steps": 1215, "loss": 0.3864, "lr": 3.524259943825493e-05, "epoch": 1.5087358684480987, "percentage": 30.21, "elapsed_time": "2:22:21", "remaining_time": "5:28:55"}
|
| 611 |
+
{"current_steps": 368, "total_steps": 1215, "loss": 0.3829, "lr": 3.5205318911237566e-05, "epoch": 1.512846865364851, "percentage": 30.29, "elapsed_time": "2:22:44", "remaining_time": "5:28:33"}
|
| 612 |
+
{"current_steps": 369, "total_steps": 1215, "loss": 0.391, "lr": 3.516791276541574e-05, "epoch": 1.5169578622816033, "percentage": 30.37, "elapsed_time": "2:23:08", "remaining_time": "5:28:09"}
|
| 613 |
+
{"current_steps": 370, "total_steps": 1215, "loss": 0.3852, "lr": 3.5130381309820474e-05, "epoch": 1.5210688591983557, "percentage": 30.45, "elapsed_time": "2:23:31", "remaining_time": "5:27:46"}
|
| 614 |
+
{"current_steps": 371, "total_steps": 1215, "loss": 0.3813, "lr": 3.509272485451806e-05, "epoch": 1.5251798561151078, "percentage": 30.53, "elapsed_time": "2:23:54", "remaining_time": "5:27:22"}
|
| 615 |
+
{"current_steps": 372, "total_steps": 1215, "loss": 0.3943, "lr": 3.5054943710607435e-05, "epoch": 1.5292908530318603, "percentage": 30.62, "elapsed_time": "2:24:16", "remaining_time": "5:26:57"}
|
| 616 |
+
{"current_steps": 373, "total_steps": 1215, "loss": 0.3813, "lr": 3.50170381902177e-05, "epoch": 1.5334018499486124, "percentage": 30.7, "elapsed_time": "2:24:39", "remaining_time": "5:26:33"}
|
| 617 |
+
{"current_steps": 374, "total_steps": 1215, "loss": 0.3818, "lr": 3.497900860650545e-05, "epoch": 1.537512846865365, "percentage": 30.78, "elapsed_time": "2:25:02", "remaining_time": "5:26:09"}
|
| 618 |
+
{"current_steps": 375, "total_steps": 1215, "loss": 0.3759, "lr": 3.494085527365224e-05, "epoch": 1.541623843782117, "percentage": 30.86, "elapsed_time": "2:25:26", "remaining_time": "5:25:47"}
|
| 619 |
+
{"current_steps": 376, "total_steps": 1215, "loss": 0.3893, "lr": 3.4902578506861995e-05, "epoch": 1.5457348406988696, "percentage": 30.95, "elapsed_time": "2:25:49", "remaining_time": "5:25:23"}
|
| 620 |
+
{"current_steps": 377, "total_steps": 1215, "loss": 0.3905, "lr": 3.486417862235839e-05, "epoch": 1.5498458376156217, "percentage": 31.03, "elapsed_time": "2:26:13", "remaining_time": "5:25:00"}
|
| 621 |
+
{"current_steps": 378, "total_steps": 1215, "loss": 0.3865, "lr": 3.4825655937382216e-05, "epoch": 1.5539568345323742, "percentage": 31.11, "elapsed_time": "2:26:36", "remaining_time": "5:24:37"}
|
| 622 |
+
{"current_steps": 379, "total_steps": 1215, "loss": 0.3932, "lr": 3.4787010770188795e-05, "epoch": 1.5580678314491263, "percentage": 31.19, "elapsed_time": "2:26:59", "remaining_time": "5:24:13"}
|
| 623 |
+
{"current_steps": 380, "total_steps": 1215, "loss": 0.3906, "lr": 3.474824344004534e-05, "epoch": 1.5621788283658788, "percentage": 31.28, "elapsed_time": "2:27:21", "remaining_time": "5:23:48"}
|
| 624 |
+
{"current_steps": 381, "total_steps": 1215, "loss": 0.3783, "lr": 3.4709354267228294e-05, "epoch": 1.566289825282631, "percentage": 31.36, "elapsed_time": "2:27:45", "remaining_time": "5:23:26"}
|
| 625 |
+
{"current_steps": 382, "total_steps": 1215, "loss": 0.3816, "lr": 3.467034357302073e-05, "epoch": 1.5704008221993835, "percentage": 31.44, "elapsed_time": "2:28:08", "remaining_time": "5:23:01"}
|
| 626 |
+
{"current_steps": 383, "total_steps": 1215, "loss": 0.3843, "lr": 3.463121167970966e-05, "epoch": 1.5745118191161356, "percentage": 31.52, "elapsed_time": "2:28:31", "remaining_time": "5:22:39"}
|
| 627 |
+
{"current_steps": 384, "total_steps": 1215, "loss": 0.3871, "lr": 3.4591958910583365e-05, "epoch": 1.5786228160328881, "percentage": 31.6, "elapsed_time": "2:28:55", "remaining_time": "5:22:16"}
|
| 628 |
+
{"current_steps": 385, "total_steps": 1215, "loss": 0.379, "lr": 3.455258558992877e-05, "epoch": 1.5827338129496402, "percentage": 31.69, "elapsed_time": "2:29:17", "remaining_time": "5:21:51"}
|
| 629 |
+
{"current_steps": 386, "total_steps": 1215, "loss": 0.3801, "lr": 3.451309204302873e-05, "epoch": 1.5868448098663928, "percentage": 31.77, "elapsed_time": "2:29:41", "remaining_time": "5:21:28"}
|
| 630 |
+
{"current_steps": 387, "total_steps": 1215, "loss": 0.379, "lr": 3.447347859615933e-05, "epoch": 1.5909558067831449, "percentage": 31.85, "elapsed_time": "2:30:04", "remaining_time": "5:21:05"}
|
| 631 |
+
{"current_steps": 388, "total_steps": 1215, "loss": 0.3745, "lr": 3.443374557658723e-05, "epoch": 1.5950668036998972, "percentage": 31.93, "elapsed_time": "2:30:26", "remaining_time": "5:20:38"}
|
| 632 |
+
{"current_steps": 389, "total_steps": 1215, "loss": 0.3807, "lr": 3.439389331256694e-05, "epoch": 1.5991778006166495, "percentage": 32.02, "elapsed_time": "2:30:48", "remaining_time": "5:20:14"}
|
| 633 |
+
{"current_steps": 390, "total_steps": 1215, "loss": 0.3832, "lr": 3.435392213333809e-05, "epoch": 1.6032887975334018, "percentage": 32.1, "elapsed_time": "2:31:10", "remaining_time": "5:19:47"}
|
| 634 |
+
{"current_steps": 391, "total_steps": 1215, "loss": 0.3692, "lr": 3.431383236912275e-05, "epoch": 1.6073997944501541, "percentage": 32.18, "elapsed_time": "2:31:34", "remaining_time": "5:19:25"}
|
| 635 |
+
{"current_steps": 392, "total_steps": 1215, "loss": 0.3728, "lr": 3.427362435112268e-05, "epoch": 1.6115107913669064, "percentage": 32.26, "elapsed_time": "2:31:57", "remaining_time": "5:19:01"}
|
| 636 |
+
{"current_steps": 393, "total_steps": 1215, "loss": 0.3868, "lr": 3.423329841151656e-05, "epoch": 1.6156217882836588, "percentage": 32.35, "elapsed_time": "2:32:18", "remaining_time": "5:18:33"}
|
| 637 |
+
{"current_steps": 394, "total_steps": 1215, "loss": 0.3724, "lr": 3.4192854883457326e-05, "epoch": 1.619732785200411, "percentage": 32.43, "elapsed_time": "2:32:42", "remaining_time": "5:18:11"}
|
| 638 |
+
{"current_steps": 395, "total_steps": 1215, "loss": 0.3755, "lr": 3.4152294101069345e-05, "epoch": 1.6238437821171634, "percentage": 32.51, "elapsed_time": "2:33:04", "remaining_time": "5:17:46"}
|
| 639 |
+
{"current_steps": 396, "total_steps": 1215, "loss": 0.3866, "lr": 3.411161639944568e-05, "epoch": 1.6279547790339157, "percentage": 32.59, "elapsed_time": "2:33:26", "remaining_time": "5:17:21"}
|
| 640 |
+
{"current_steps": 397, "total_steps": 1215, "loss": 0.3842, "lr": 3.407082211464534e-05, "epoch": 1.632065775950668, "percentage": 32.67, "elapsed_time": "2:33:49", "remaining_time": "5:16:57"}
|
| 641 |
+
{"current_steps": 398, "total_steps": 1215, "loss": 0.3856, "lr": 3.402991158369047e-05, "epoch": 1.6361767728674204, "percentage": 32.76, "elapsed_time": "2:34:13", "remaining_time": "5:16:35"}
|
| 642 |
+
{"current_steps": 399, "total_steps": 1215, "loss": 0.3738, "lr": 3.39888851445636e-05, "epoch": 1.6402877697841727, "percentage": 32.84, "elapsed_time": "2:34:36", "remaining_time": "5:16:11"}
|
| 643 |
+
{"current_steps": 400, "total_steps": 1215, "loss": 0.3768, "lr": 3.394774313620481e-05, "epoch": 1.644398766700925, "percentage": 32.92, "elapsed_time": "2:34:59", "remaining_time": "5:15:47"}
|
| 644 |
+
{"current_steps": 401, "total_steps": 1215, "loss": 0.3854, "lr": 3.390648589850897e-05, "epoch": 1.6485097636176773, "percentage": 33.0, "elapsed_time": "2:35:22", "remaining_time": "5:15:24"}
|
| 645 |
+
{"current_steps": 402, "total_steps": 1215, "loss": 0.383, "lr": 3.386511377232293e-05, "epoch": 1.6526207605344296, "percentage": 33.09, "elapsed_time": "2:35:45", "remaining_time": "5:15:00"}
|
| 646 |
+
{"current_steps": 403, "total_steps": 1215, "loss": 0.3913, "lr": 3.382362709944268e-05, "epoch": 1.656731757451182, "percentage": 33.17, "elapsed_time": "2:36:08", "remaining_time": "5:14:36"}
|
| 647 |
+
{"current_steps": 404, "total_steps": 1215, "loss": 0.3912, "lr": 3.3782026222610525e-05, "epoch": 1.6608427543679343, "percentage": 33.25, "elapsed_time": "2:36:32", "remaining_time": "5:14:14"}
|
| 648 |
+
{"current_steps": 405, "total_steps": 1215, "loss": 0.3785, "lr": 3.374031148551229e-05, "epoch": 1.6649537512846866, "percentage": 33.33, "elapsed_time": "2:36:55", "remaining_time": "5:13:51"}
|
| 649 |
+
{"current_steps": 406, "total_steps": 1215, "loss": 0.3811, "lr": 3.3698483232774435e-05, "epoch": 1.6690647482014387, "percentage": 33.42, "elapsed_time": "2:37:19", "remaining_time": "5:13:28"}
|
| 650 |
+
{"current_steps": 407, "total_steps": 1215, "loss": 0.3765, "lr": 3.365654180996126e-05, "epoch": 1.6731757451181912, "percentage": 33.5, "elapsed_time": "2:37:42", "remaining_time": "5:13:05"}
|
| 651 |
+
{"current_steps": 408, "total_steps": 1215, "loss": 0.3855, "lr": 3.361448756357199e-05, "epoch": 1.6772867420349433, "percentage": 33.58, "elapsed_time": "2:38:05", "remaining_time": "5:12:41"}
|
| 652 |
+
{"current_steps": 409, "total_steps": 1215, "loss": 0.3776, "lr": 3.3572320841037945e-05, "epoch": 1.6813977389516959, "percentage": 33.66, "elapsed_time": "2:38:27", "remaining_time": "5:12:16"}
|
| 653 |
+
{"current_steps": 410, "total_steps": 1215, "loss": 0.389, "lr": 3.353004199071969e-05, "epoch": 1.685508735868448, "percentage": 33.74, "elapsed_time": "2:38:51", "remaining_time": "5:11:54"}
|
| 654 |
+
{"current_steps": 411, "total_steps": 1215, "loss": 0.3844, "lr": 3.348765136190412e-05, "epoch": 1.6896197327852005, "percentage": 33.83, "elapsed_time": "2:39:14", "remaining_time": "5:11:30"}
|
| 655 |
+
{"current_steps": 412, "total_steps": 1215, "loss": 0.3718, "lr": 3.344514930480158e-05, "epoch": 1.6937307297019526, "percentage": 33.91, "elapsed_time": "2:39:37", "remaining_time": "5:11:05"}
|
| 656 |
+
{"current_steps": 413, "total_steps": 1215, "loss": 0.4017, "lr": 3.3402536170542985e-05, "epoch": 1.6978417266187051, "percentage": 33.99, "elapsed_time": "2:39:59", "remaining_time": "5:10:41"}
|
| 657 |
+
{"current_steps": 414, "total_steps": 1215, "loss": 0.3786, "lr": 3.335981231117694e-05, "epoch": 1.7019527235354572, "percentage": 34.07, "elapsed_time": "2:40:21", "remaining_time": "5:10:15"}
|
| 658 |
+
{"current_steps": 415, "total_steps": 1215, "loss": 0.3902, "lr": 3.331697807966676e-05, "epoch": 1.7060637204522098, "percentage": 34.16, "elapsed_time": "2:40:45", "remaining_time": "5:09:53"}
|
| 659 |
+
{"current_steps": 416, "total_steps": 1215, "loss": 0.382, "lr": 3.327403382988764e-05, "epoch": 1.7101747173689619, "percentage": 34.24, "elapsed_time": "2:41:07", "remaining_time": "5:09:29"}
|
| 660 |
+
{"current_steps": 417, "total_steps": 1215, "loss": 0.3868, "lr": 3.3230979916623667e-05, "epoch": 1.7142857142857144, "percentage": 34.32, "elapsed_time": "2:41:30", "remaining_time": "5:09:04"}
|
| 661 |
+
{"current_steps": 418, "total_steps": 1215, "loss": 0.4025, "lr": 3.318781669556493e-05, "epoch": 1.7183967112024665, "percentage": 34.4, "elapsed_time": "2:41:52", "remaining_time": "5:08:38"}
|
| 662 |
+
{"current_steps": 419, "total_steps": 1215, "loss": 0.3868, "lr": 3.3144544523304545e-05, "epoch": 1.722507708119219, "percentage": 34.49, "elapsed_time": "2:42:15", "remaining_time": "5:08:14"}
|
| 663 |
+
{"current_steps": 420, "total_steps": 1215, "loss": 0.3848, "lr": 3.310116375733575e-05, "epoch": 1.7266187050359711, "percentage": 34.57, "elapsed_time": "2:42:38", "remaining_time": "5:07:51"}
|
| 664 |
+
{"current_steps": 421, "total_steps": 1215, "loss": 0.3884, "lr": 3.3057674756048906e-05, "epoch": 1.7307297019527237, "percentage": 34.65, "elapsed_time": "2:43:01", "remaining_time": "5:07:27"}
|
| 665 |
+
{"current_steps": 422, "total_steps": 1215, "loss": 0.3962, "lr": 3.30140778787286e-05, "epoch": 1.7348406988694758, "percentage": 34.73, "elapsed_time": "2:43:22", "remaining_time": "5:07:00"}
|
| 666 |
+
{"current_steps": 423, "total_steps": 1215, "loss": 0.3804, "lr": 3.297037348555059e-05, "epoch": 1.7389516957862283, "percentage": 34.81, "elapsed_time": "2:43:45", "remaining_time": "5:06:36"}
|
| 667 |
+
{"current_steps": 424, "total_steps": 1215, "loss": 0.3808, "lr": 3.292656193757891e-05, "epoch": 1.7430626927029804, "percentage": 34.9, "elapsed_time": "2:44:09", "remaining_time": "5:06:14"}
|
| 668 |
+
{"current_steps": 425, "total_steps": 1215, "loss": 0.3766, "lr": 3.2882643596762847e-05, "epoch": 1.7471736896197327, "percentage": 34.98, "elapsed_time": "2:44:32", "remaining_time": "5:05:50"}
|
| 669 |
+
{"current_steps": 426, "total_steps": 1215, "loss": 0.3629, "lr": 3.283861882593394e-05, "epoch": 1.751284686536485, "percentage": 35.06, "elapsed_time": "2:44:53", "remaining_time": "5:05:24"}
|
| 670 |
+
{"current_steps": 427, "total_steps": 1215, "loss": 0.3946, "lr": 3.2794487988803024e-05, "epoch": 1.7553956834532374, "percentage": 35.14, "elapsed_time": "2:45:17", "remaining_time": "5:05:01"}
|
| 671 |
+
{"current_steps": 428, "total_steps": 1215, "loss": 0.3826, "lr": 3.275025144995719e-05, "epoch": 1.7595066803699897, "percentage": 35.23, "elapsed_time": "2:45:39", "remaining_time": "5:04:36"}
|
| 672 |
+
{"current_steps": 429, "total_steps": 1215, "loss": 0.3822, "lr": 3.270590957485678e-05, "epoch": 1.763617677286742, "percentage": 35.31, "elapsed_time": "2:46:02", "remaining_time": "5:04:12"}
|
| 673 |
+
{"current_steps": 430, "total_steps": 1215, "loss": 0.379, "lr": 3.266146272983238e-05, "epoch": 1.7677286742034943, "percentage": 35.39, "elapsed_time": "2:46:24", "remaining_time": "5:03:48"}
|
| 674 |
+
{"current_steps": 431, "total_steps": 1215, "loss": 0.3781, "lr": 3.261691128208178e-05, "epoch": 1.7718396711202467, "percentage": 35.47, "elapsed_time": "2:46:47", "remaining_time": "5:03:23"}
|
| 675 |
+
{"current_steps": 432, "total_steps": 1215, "loss": 0.3858, "lr": 3.2572255599666946e-05, "epoch": 1.775950668036999, "percentage": 35.56, "elapsed_time": "2:47:11", "remaining_time": "5:03:01"}
|
| 676 |
+
{"current_steps": 433, "total_steps": 1215, "loss": 0.3889, "lr": 3.252749605151099e-05, "epoch": 1.7800616649537513, "percentage": 35.64, "elapsed_time": "2:47:34", "remaining_time": "5:02:38"}
|
| 677 |
+
{"current_steps": 434, "total_steps": 1215, "loss": 0.3828, "lr": 3.24826330073951e-05, "epoch": 1.7841726618705036, "percentage": 35.72, "elapsed_time": "2:47:56", "remaining_time": "5:02:13"}
|
| 678 |
+
{"current_steps": 435, "total_steps": 1215, "loss": 0.3821, "lr": 3.2437666837955495e-05, "epoch": 1.788283658787256, "percentage": 35.8, "elapsed_time": "2:48:17", "remaining_time": "5:01:45"}
|
| 679 |
+
{"current_steps": 436, "total_steps": 1215, "loss": 0.3782, "lr": 3.239259791468037e-05, "epoch": 1.7923946557040082, "percentage": 35.88, "elapsed_time": "2:48:40", "remaining_time": "5:01:22"}
|
| 680 |
+
{"current_steps": 437, "total_steps": 1215, "loss": 0.3886, "lr": 3.234742660990681e-05, "epoch": 1.7965056526207606, "percentage": 35.97, "elapsed_time": "2:49:02", "remaining_time": "5:00:56"}
|
| 681 |
+
{"current_steps": 438, "total_steps": 1215, "loss": 0.3865, "lr": 3.230215329681775e-05, "epoch": 1.8006166495375129, "percentage": 36.05, "elapsed_time": "2:49:25", "remaining_time": "5:00:33"}
|
| 682 |
+
{"current_steps": 439, "total_steps": 1215, "loss": 0.3798, "lr": 3.225677834943884e-05, "epoch": 1.8047276464542652, "percentage": 36.13, "elapsed_time": "2:49:48", "remaining_time": "5:00:10"}
|
| 683 |
+
{"current_steps": 440, "total_steps": 1215, "loss": 0.371, "lr": 3.22113021426354e-05, "epoch": 1.8088386433710175, "percentage": 36.21, "elapsed_time": "2:50:11", "remaining_time": "4:59:46"}
|
| 684 |
+
{"current_steps": 441, "total_steps": 1215, "loss": 0.386, "lr": 3.216572505210929e-05, "epoch": 1.8129496402877698, "percentage": 36.3, "elapsed_time": "2:50:35", "remaining_time": "4:59:23"}
|
| 685 |
+
{"current_steps": 442, "total_steps": 1215, "loss": 0.3837, "lr": 3.2120047454395845e-05, "epoch": 1.8170606372045222, "percentage": 36.38, "elapsed_time": "2:50:58", "remaining_time": "4:59:01"}
|
| 686 |
+
{"current_steps": 443, "total_steps": 1215, "loss": 0.3892, "lr": 3.207426972686071e-05, "epoch": 1.8211716341212743, "percentage": 36.46, "elapsed_time": "2:51:21", "remaining_time": "4:58:36"}
|
| 687 |
+
{"current_steps": 444, "total_steps": 1215, "loss": 0.3911, "lr": 3.202839224769678e-05, "epoch": 1.8252826310380268, "percentage": 36.54, "elapsed_time": "2:51:43", "remaining_time": "4:58:12"}
|
| 688 |
+
{"current_steps": 445, "total_steps": 1215, "loss": 0.388, "lr": 3.198241539592103e-05, "epoch": 1.829393627954779, "percentage": 36.63, "elapsed_time": "2:52:06", "remaining_time": "4:57:48"}
|
| 689 |
+
{"current_steps": 446, "total_steps": 1215, "loss": 0.3733, "lr": 3.1936339551371416e-05, "epoch": 1.8335046248715314, "percentage": 36.71, "elapsed_time": "2:52:29", "remaining_time": "4:57:24"}
|
| 690 |
+
{"current_steps": 447, "total_steps": 1215, "loss": 0.382, "lr": 3.1890165094703704e-05, "epoch": 1.8376156217882835, "percentage": 36.79, "elapsed_time": "2:52:52", "remaining_time": "4:57:02"}
|
| 691 |
+
{"current_steps": 448, "total_steps": 1215, "loss": 0.3843, "lr": 3.184389240738838e-05, "epoch": 1.841726618705036, "percentage": 36.87, "elapsed_time": "2:53:16", "remaining_time": "4:56:39"}
|
| 692 |
+
{"current_steps": 449, "total_steps": 1215, "loss": 0.3914, "lr": 3.179752187170741e-05, "epoch": 1.8458376156217882, "percentage": 36.95, "elapsed_time": "2:53:39", "remaining_time": "4:56:16"}
|
| 693 |
+
{"current_steps": 450, "total_steps": 1215, "loss": 0.3843, "lr": 3.1751053870751184e-05, "epoch": 1.8499486125385407, "percentage": 37.04, "elapsed_time": "2:54:03", "remaining_time": "4:55:53"}
|
| 694 |
+
{"current_steps": 451, "total_steps": 1215, "loss": 0.3855, "lr": 3.1704488788415274e-05, "epoch": 1.8540596094552928, "percentage": 37.12, "elapsed_time": "2:54:26", "remaining_time": "4:55:29"}
|
| 695 |
+
{"current_steps": 452, "total_steps": 1215, "loss": 0.386, "lr": 3.16578270093973e-05, "epoch": 1.8581706063720453, "percentage": 37.2, "elapsed_time": "2:54:48", "remaining_time": "4:55:05"}
|
| 696 |
+
{"current_steps": 453, "total_steps": 1215, "loss": 0.3783, "lr": 3.1611068919193756e-05, "epoch": 1.8622816032887974, "percentage": 37.28, "elapsed_time": "2:55:10", "remaining_time": "4:54:40"}
|
| 697 |
+
{"current_steps": 454, "total_steps": 1215, "loss": 0.385, "lr": 3.1564214904096774e-05, "epoch": 1.86639260020555, "percentage": 37.37, "elapsed_time": "2:55:33", "remaining_time": "4:54:15"}
|
| 698 |
+
{"current_steps": 455, "total_steps": 1215, "loss": 0.3841, "lr": 3.1517265351191e-05, "epoch": 1.870503597122302, "percentage": 37.45, "elapsed_time": "2:55:54", "remaining_time": "4:53:49"}
|
| 699 |
+
{"current_steps": 456, "total_steps": 1215, "loss": 0.385, "lr": 3.147022064835036e-05, "epoch": 1.8746145940390546, "percentage": 37.53, "elapsed_time": "2:56:18", "remaining_time": "4:53:26"}
|
| 700 |
+
{"current_steps": 457, "total_steps": 1215, "loss": 0.3808, "lr": 3.142308118423485e-05, "epoch": 1.8787255909558067, "percentage": 37.61, "elapsed_time": "2:56:41", "remaining_time": "4:53:03"}
|
| 701 |
+
{"current_steps": 458, "total_steps": 1215, "loss": 0.3898, "lr": 3.1375847348287365e-05, "epoch": 1.8828365878725593, "percentage": 37.7, "elapsed_time": "2:57:03", "remaining_time": "4:52:39"}
|
| 702 |
+
{"current_steps": 459, "total_steps": 1215, "loss": 0.3823, "lr": 3.132851953073041e-05, "epoch": 1.8869475847893113, "percentage": 37.78, "elapsed_time": "2:57:25", "remaining_time": "4:52:13"}
|
| 703 |
+
{"current_steps": 460, "total_steps": 1215, "loss": 0.379, "lr": 3.128109812256296e-05, "epoch": 1.8910585817060637, "percentage": 37.86, "elapsed_time": "2:57:47", "remaining_time": "4:51:48"}
|
| 704 |
+
{"current_steps": 461, "total_steps": 1215, "loss": 0.3802, "lr": 3.1233583515557166e-05, "epoch": 1.895169578622816, "percentage": 37.94, "elapsed_time": "2:58:10", "remaining_time": "4:51:25"}
|
| 705 |
+
{"current_steps": 462, "total_steps": 1215, "loss": 0.3648, "lr": 3.118597610225514e-05, "epoch": 1.8992805755395683, "percentage": 38.02, "elapsed_time": "2:58:34", "remaining_time": "4:51:03"}
|
| 706 |
+
{"current_steps": 463, "total_steps": 1215, "loss": 0.3845, "lr": 3.113827627596575e-05, "epoch": 1.9033915724563206, "percentage": 38.11, "elapsed_time": "2:58:55", "remaining_time": "4:50:37"}
|
| 707 |
+
{"current_steps": 464, "total_steps": 1215, "loss": 0.3968, "lr": 3.1090484430761275e-05, "epoch": 1.907502569373073, "percentage": 38.19, "elapsed_time": "2:59:18", "remaining_time": "4:50:13"}
|
| 708 |
+
{"current_steps": 465, "total_steps": 1215, "loss": 0.3825, "lr": 3.104260096147426e-05, "epoch": 1.9116135662898253, "percentage": 38.27, "elapsed_time": "2:59:41", "remaining_time": "4:49:49"}
|
| 709 |
+
{"current_steps": 466, "total_steps": 1215, "loss": 0.379, "lr": 3.099462626369418e-05, "epoch": 1.9157245632065776, "percentage": 38.35, "elapsed_time": "3:00:04", "remaining_time": "4:49:26"}
|
| 710 |
+
{"current_steps": 467, "total_steps": 1215, "loss": 0.3882, "lr": 3.094656073376419e-05, "epoch": 1.91983556012333, "percentage": 38.44, "elapsed_time": "3:00:28", "remaining_time": "4:49:03"}
|
| 711 |
+
{"current_steps": 468, "total_steps": 1215, "loss": 0.3855, "lr": 3.0898404768777863e-05, "epoch": 1.9239465570400822, "percentage": 38.52, "elapsed_time": "3:00:51", "remaining_time": "4:48:40"}
|
| 712 |
+
{"current_steps": 469, "total_steps": 1215, "loss": 0.3843, "lr": 3.0850158766575907e-05, "epoch": 1.9280575539568345, "percentage": 38.6, "elapsed_time": "3:01:14", "remaining_time": "4:48:16"}
|
| 713 |
+
{"current_steps": 470, "total_steps": 1215, "loss": 0.3746, "lr": 3.080182312574286e-05, "epoch": 1.9321685508735869, "percentage": 38.68, "elapsed_time": "3:01:37", "remaining_time": "4:47:53"}
|
| 714 |
+
{"current_steps": 471, "total_steps": 1215, "loss": 0.3718, "lr": 3.075339824560382e-05, "epoch": 1.9362795477903392, "percentage": 38.77, "elapsed_time": "3:02:00", "remaining_time": "4:47:30"}
|
| 715 |
+
{"current_steps": 472, "total_steps": 1215, "loss": 0.3934, "lr": 3.070488452622113e-05, "epoch": 1.9403905447070915, "percentage": 38.85, "elapsed_time": "3:02:23", "remaining_time": "4:47:06"}
|
| 716 |
+
{"current_steps": 473, "total_steps": 1215, "loss": 0.3729, "lr": 3.0656282368391086e-05, "epoch": 1.9445015416238438, "percentage": 38.93, "elapsed_time": "3:02:45", "remaining_time": "4:46:42"}
|
| 717 |
+
{"current_steps": 474, "total_steps": 1215, "loss": 0.3795, "lr": 3.0607592173640615e-05, "epoch": 1.9486125385405961, "percentage": 39.01, "elapsed_time": "3:03:08", "remaining_time": "4:46:18"}
|
| 718 |
+
{"current_steps": 475, "total_steps": 1215, "loss": 0.3981, "lr": 3.055881434422395e-05, "epoch": 1.9527235354573484, "percentage": 39.09, "elapsed_time": "3:03:31", "remaining_time": "4:45:54"}
|
| 719 |
+
{"current_steps": 476, "total_steps": 1215, "loss": 0.3717, "lr": 3.0509949283119348e-05, "epoch": 1.9568345323741008, "percentage": 39.18, "elapsed_time": "3:03:54", "remaining_time": "4:45:31"}
|
| 720 |
+
{"current_steps": 477, "total_steps": 1215, "loss": 0.3993, "lr": 3.0460997394025694e-05, "epoch": 1.960945529290853, "percentage": 39.26, "elapsed_time": "3:04:17", "remaining_time": "4:45:08"}
|
| 721 |
+
{"current_steps": 478, "total_steps": 1215, "loss": 0.3865, "lr": 3.0411959081359223e-05, "epoch": 1.9650565262076052, "percentage": 39.34, "elapsed_time": "3:04:40", "remaining_time": "4:44:44"}
|
| 722 |
+
{"current_steps": 479, "total_steps": 1215, "loss": 0.3784, "lr": 3.036283475025016e-05, "epoch": 1.9691675231243577, "percentage": 39.42, "elapsed_time": "3:05:04", "remaining_time": "4:44:22"}
|
| 723 |
+
{"current_steps": 480, "total_steps": 1215, "loss": 0.3762, "lr": 3.031362480653937e-05, "epoch": 1.9732785200411098, "percentage": 39.51, "elapsed_time": "3:05:27", "remaining_time": "4:43:58"}
|
| 724 |
+
{"current_steps": 481, "total_steps": 1215, "loss": 0.3757, "lr": 3.0264329656775e-05, "epoch": 1.9773895169578624, "percentage": 39.59, "elapsed_time": "3:05:49", "remaining_time": "4:43:34"}
|
| 725 |
+
{"current_steps": 482, "total_steps": 1215, "loss": 0.3827, "lr": 3.021494970820912e-05, "epoch": 1.9815005138746145, "percentage": 39.67, "elapsed_time": "3:06:11", "remaining_time": "4:43:08"}
|
| 726 |
+
{"current_steps": 483, "total_steps": 1215, "loss": 0.3642, "lr": 3.01654853687944e-05, "epoch": 1.985611510791367, "percentage": 39.75, "elapsed_time": "3:06:34", "remaining_time": "4:42:45"}
|
| 727 |
+
{"current_steps": 484, "total_steps": 1215, "loss": 0.3963, "lr": 3.011593704718067e-05, "epoch": 1.989722507708119, "percentage": 39.84, "elapsed_time": "3:06:57", "remaining_time": "4:42:21"}
|
| 728 |
+
{"current_steps": 485, "total_steps": 1215, "loss": 0.3878, "lr": 3.0066305152711598e-05, "epoch": 1.9938335046248716, "percentage": 39.92, "elapsed_time": "3:07:21", "remaining_time": "4:41:59"}
|
| 729 |
+
{"current_steps": 486, "total_steps": 1215, "loss": 0.3721, "lr": 3.0016590095421273e-05, "epoch": 1.9979445015416237, "percentage": 40.0, "elapsed_time": "3:07:45", "remaining_time": "4:41:37"}
|
| 730 |
+
{"current_steps": 487, "total_steps": 1215, "loss": 0.3396, "lr": 2.9966792286030853e-05, "epoch": 2.0020554984583763, "percentage": 40.08, "elapsed_time": "3:09:49", "remaining_time": "4:43:45"}
|
| 731 |
+
{"current_steps": 488, "total_steps": 1215, "loss": 0.3326, "lr": 2.9916912135945147e-05, "epoch": 2.0061664953751284, "percentage": 40.16, "elapsed_time": "3:10:12", "remaining_time": "4:43:21"}
|
| 732 |
+
{"current_steps": 489, "total_steps": 1215, "loss": 0.3331, "lr": 2.986695005724921e-05, "epoch": 2.010277492291881, "percentage": 40.25, "elapsed_time": "3:10:35", "remaining_time": "4:42:58"}
|
| 733 |
+
{"current_steps": 490, "total_steps": 1215, "loss": 0.3318, "lr": 2.9816906462704963e-05, "epoch": 2.014388489208633, "percentage": 40.33, "elapsed_time": "3:10:59", "remaining_time": "4:42:35"}
|
| 734 |
+
{"current_steps": 491, "total_steps": 1215, "loss": 0.331, "lr": 2.9766781765747775e-05, "epoch": 2.0184994861253855, "percentage": 40.41, "elapsed_time": "3:11:23", "remaining_time": "4:42:12"}
|
| 735 |
+
{"current_steps": 492, "total_steps": 1215, "loss": 0.3318, "lr": 2.971657638048302e-05, "epoch": 2.0226104830421376, "percentage": 40.49, "elapsed_time": "3:11:47", "remaining_time": "4:41:49"}
|
| 736 |
+
{"current_steps": 493, "total_steps": 1215, "loss": 0.3344, "lr": 2.966629072168271e-05, "epoch": 2.02672147995889, "percentage": 40.58, "elapsed_time": "3:12:09", "remaining_time": "4:41:25"}
|
| 737 |
+
{"current_steps": 494, "total_steps": 1215, "loss": 0.3177, "lr": 2.9615925204782006e-05, "epoch": 2.0308324768756423, "percentage": 40.66, "elapsed_time": "3:12:32", "remaining_time": "4:41:01"}
|
| 738 |
+
{"current_steps": 495, "total_steps": 1215, "loss": 0.3358, "lr": 2.9565480245875845e-05, "epoch": 2.034943473792395, "percentage": 40.74, "elapsed_time": "3:12:56", "remaining_time": "4:40:37"}
|
| 739 |
+
{"current_steps": 496, "total_steps": 1215, "loss": 0.3303, "lr": 2.9514956261715458e-05, "epoch": 2.039054470709147, "percentage": 40.82, "elapsed_time": "3:13:19", "remaining_time": "4:40:14"}
|
| 740 |
+
{"current_steps": 497, "total_steps": 1215, "loss": 0.3683, "lr": 2.9464353669704943e-05, "epoch": 2.0431654676258995, "percentage": 40.91, "elapsed_time": "3:13:42", "remaining_time": "4:39:50"}
|
| 741 |
+
{"current_steps": 498, "total_steps": 1215, "loss": 0.34, "lr": 2.9413672887897828e-05, "epoch": 2.0472764645426516, "percentage": 40.99, "elapsed_time": "3:14:05", "remaining_time": "4:39:27"}
|
| 742 |
+
{"current_steps": 499, "total_steps": 1215, "loss": 0.3304, "lr": 2.936291433499359e-05, "epoch": 2.051387461459404, "percentage": 41.07, "elapsed_time": "3:14:29", "remaining_time": "4:39:03"}
|
| 743 |
+
{"current_steps": 500, "total_steps": 1215, "loss": 0.3358, "lr": 2.9312078430334228e-05, "epoch": 2.055498458376156, "percentage": 41.15, "elapsed_time": "3:14:52", "remaining_time": "4:38:40"}
|
| 744 |
+
{"current_steps": 501, "total_steps": 1215, "loss": 0.3232, "lr": 2.926116559390078e-05, "epoch": 2.0596094552929087, "percentage": 41.23, "elapsed_time": "3:15:15", "remaining_time": "4:38:16"}
|
| 745 |
+
{"current_steps": 502, "total_steps": 1215, "loss": 0.323, "lr": 2.921017624630984e-05, "epoch": 2.063720452209661, "percentage": 41.32, "elapsed_time": "3:15:39", "remaining_time": "4:37:54"}
|
| 746 |
+
{"current_steps": 503, "total_steps": 1215, "loss": 0.3192, "lr": 2.9159110808810125e-05, "epoch": 2.0678314491264134, "percentage": 41.4, "elapsed_time": "3:16:01", "remaining_time": "4:37:28"}
|
| 747 |
+
{"current_steps": 504, "total_steps": 1215, "loss": 0.3354, "lr": 2.9107969703278952e-05, "epoch": 2.0719424460431655, "percentage": 41.48, "elapsed_time": "3:16:25", "remaining_time": "4:37:05"}
|
| 748 |
+
{"current_steps": 505, "total_steps": 1215, "loss": 0.3299, "lr": 2.905675335221877e-05, "epoch": 2.0760534429599176, "percentage": 41.56, "elapsed_time": "3:16:48", "remaining_time": "4:36:42"}
|
| 749 |
+
{"current_steps": 506, "total_steps": 1215, "loss": 0.3288, "lr": 2.900546217875368e-05, "epoch": 2.08016443987667, "percentage": 41.65, "elapsed_time": "3:17:10", "remaining_time": "4:36:16"}
|
| 750 |
+
{"current_steps": 507, "total_steps": 1215, "loss": 0.3328, "lr": 2.895409660662592e-05, "epoch": 2.084275436793422, "percentage": 41.73, "elapsed_time": "3:17:34", "remaining_time": "4:35:54"}
|
| 751 |
+
{"current_steps": 508, "total_steps": 1215, "loss": 0.3376, "lr": 2.8902657060192366e-05, "epoch": 2.0883864337101747, "percentage": 41.81, "elapsed_time": "3:17:58", "remaining_time": "4:35:31"}
|
| 752 |
+
{"current_steps": 509, "total_steps": 1215, "loss": 0.3356, "lr": 2.8851143964421048e-05, "epoch": 2.092497430626927, "percentage": 41.89, "elapsed_time": "3:18:20", "remaining_time": "4:35:05"}
|
| 753 |
+
{"current_steps": 510, "total_steps": 1215, "loss": 0.332, "lr": 2.879955774488762e-05, "epoch": 2.0966084275436794, "percentage": 41.98, "elapsed_time": "3:18:42", "remaining_time": "4:34:41"}
|
| 754 |
+
{"current_steps": 511, "total_steps": 1215, "loss": 0.3389, "lr": 2.8747898827771846e-05, "epoch": 2.1007194244604315, "percentage": 42.06, "elapsed_time": "3:19:04", "remaining_time": "4:34:15"}
|
| 755 |
+
{"current_steps": 512, "total_steps": 1215, "loss": 0.341, "lr": 2.8696167639854073e-05, "epoch": 2.104830421377184, "percentage": 42.14, "elapsed_time": "3:19:27", "remaining_time": "4:33:52"}
|
| 756 |
+
{"current_steps": 513, "total_steps": 1215, "loss": 0.3299, "lr": 2.864436460851173e-05, "epoch": 2.108941418293936, "percentage": 42.22, "elapsed_time": "3:19:49", "remaining_time": "4:33:26"}
|
| 757 |
+
{"current_steps": 514, "total_steps": 1215, "loss": 0.3191, "lr": 2.8592490161715768e-05, "epoch": 2.1130524152106887, "percentage": 42.3, "elapsed_time": "3:20:11", "remaining_time": "4:33:01"}
|
| 758 |
+
{"current_steps": 515, "total_steps": 1215, "loss": 0.3145, "lr": 2.8540544728027145e-05, "epoch": 2.1171634121274407, "percentage": 42.39, "elapsed_time": "3:20:34", "remaining_time": "4:32:38"}
|
| 759 |
+
{"current_steps": 516, "total_steps": 1215, "loss": 0.3275, "lr": 2.8488528736593278e-05, "epoch": 2.1212744090441933, "percentage": 42.47, "elapsed_time": "3:20:57", "remaining_time": "4:32:13"}
|
| 760 |
+
{"current_steps": 517, "total_steps": 1215, "loss": 0.3384, "lr": 2.843644261714448e-05, "epoch": 2.1253854059609454, "percentage": 42.55, "elapsed_time": "3:21:20", "remaining_time": "4:31:50"}
|
| 761 |
+
{"current_steps": 518, "total_steps": 1215, "loss": 0.3296, "lr": 2.8384286799990452e-05, "epoch": 2.129496402877698, "percentage": 42.63, "elapsed_time": "3:21:42", "remaining_time": "4:31:24"}
|
| 762 |
+
{"current_steps": 519, "total_steps": 1215, "loss": 0.32, "lr": 2.8332061716016692e-05, "epoch": 2.13360739979445, "percentage": 42.72, "elapsed_time": "3:22:05", "remaining_time": "4:31:01"}
|
| 763 |
+
{"current_steps": 520, "total_steps": 1215, "loss": 0.3332, "lr": 2.8279767796680934e-05, "epoch": 2.1377183967112026, "percentage": 42.8, "elapsed_time": "3:22:28", "remaining_time": "4:30:37"}
|
| 764 |
+
{"current_steps": 521, "total_steps": 1215, "loss": 0.325, "lr": 2.8227405474009616e-05, "epoch": 2.1418293936279547, "percentage": 42.88, "elapsed_time": "3:22:51", "remaining_time": "4:30:13"}
|
| 765 |
+
{"current_steps": 522, "total_steps": 1215, "loss": 0.3286, "lr": 2.817497518059428e-05, "epoch": 2.145940390544707, "percentage": 42.96, "elapsed_time": "3:23:15", "remaining_time": "4:29:50"}
|
| 766 |
+
{"current_steps": 523, "total_steps": 1215, "loss": 0.3247, "lr": 2.8122477349588005e-05, "epoch": 2.1500513874614593, "percentage": 43.05, "elapsed_time": "3:23:39", "remaining_time": "4:29:27"}
|
| 767 |
+
{"current_steps": 524, "total_steps": 1215, "loss": 0.3338, "lr": 2.8069912414701842e-05, "epoch": 2.154162384378212, "percentage": 43.13, "elapsed_time": "3:24:01", "remaining_time": "4:29:03"}
|
| 768 |
+
{"current_steps": 525, "total_steps": 1215, "loss": 0.3307, "lr": 2.8017280810201213e-05, "epoch": 2.158273381294964, "percentage": 43.21, "elapsed_time": "3:24:24", "remaining_time": "4:28:39"}
|
| 769 |
+
{"current_steps": 526, "total_steps": 1215, "loss": 0.3263, "lr": 2.7964582970902338e-05, "epoch": 2.1623843782117165, "percentage": 43.29, "elapsed_time": "3:24:47", "remaining_time": "4:28:15"}
|
| 770 |
+
{"current_steps": 527, "total_steps": 1215, "loss": 0.3302, "lr": 2.7911819332168627e-05, "epoch": 2.1664953751284686, "percentage": 43.37, "elapsed_time": "3:25:11", "remaining_time": "4:27:52"}
|
| 771 |
+
{"current_steps": 528, "total_steps": 1215, "loss": 0.3307, "lr": 2.78589903299071e-05, "epoch": 2.170606372045221, "percentage": 43.46, "elapsed_time": "3:25:34", "remaining_time": "4:27:29"}
|
| 772 |
+
{"current_steps": 529, "total_steps": 1215, "loss": 0.3234, "lr": 2.7806096400564775e-05, "epoch": 2.174717368961973, "percentage": 43.54, "elapsed_time": "3:25:57", "remaining_time": "4:27:05"}
|
| 773 |
+
{"current_steps": 530, "total_steps": 1215, "loss": 0.3354, "lr": 2.7753137981125068e-05, "epoch": 2.1788283658787257, "percentage": 43.62, "elapsed_time": "3:26:21", "remaining_time": "4:26:41"}
|
| 774 |
+
{"current_steps": 531, "total_steps": 1215, "loss": 0.336, "lr": 2.7700115509104176e-05, "epoch": 2.182939362795478, "percentage": 43.7, "elapsed_time": "3:26:44", "remaining_time": "4:26:18"}
|
| 775 |
+
{"current_steps": 532, "total_steps": 1215, "loss": 0.3326, "lr": 2.7647029422547465e-05, "epoch": 2.1870503597122304, "percentage": 43.79, "elapsed_time": "3:27:07", "remaining_time": "4:25:55"}
|
| 776 |
+
{"current_steps": 533, "total_steps": 1215, "loss": 0.3354, "lr": 2.7593880160025864e-05, "epoch": 2.1911613566289825, "percentage": 43.87, "elapsed_time": "3:27:29", "remaining_time": "4:25:30"}
|
| 777 |
+
{"current_steps": 534, "total_steps": 1215, "loss": 0.3194, "lr": 2.754066816063222e-05, "epoch": 2.195272353545735, "percentage": 43.95, "elapsed_time": "3:27:53", "remaining_time": "4:25:06"}
|
| 778 |
+
{"current_steps": 535, "total_steps": 1215, "loss": 0.3369, "lr": 2.7487393863977687e-05, "epoch": 2.199383350462487, "percentage": 44.03, "elapsed_time": "3:28:16", "remaining_time": "4:24:43"}
|
| 779 |
+
{"current_steps": 536, "total_steps": 1215, "loss": 0.3157, "lr": 2.7434057710188077e-05, "epoch": 2.2034943473792397, "percentage": 44.12, "elapsed_time": "3:28:39", "remaining_time": "4:24:19"}
|
| 780 |
+
{"current_steps": 537, "total_steps": 1215, "loss": 0.3153, "lr": 2.738066013990025e-05, "epoch": 2.2076053442959918, "percentage": 44.2, "elapsed_time": "3:29:03", "remaining_time": "4:23:56"}
|
| 781 |
+
{"current_steps": 538, "total_steps": 1215, "loss": 0.3296, "lr": 2.732720159425845e-05, "epoch": 2.2117163412127443, "percentage": 44.28, "elapsed_time": "3:29:25", "remaining_time": "4:23:32"}
|
| 782 |
+
{"current_steps": 539, "total_steps": 1215, "loss": 0.3247, "lr": 2.7273682514910668e-05, "epoch": 2.2158273381294964, "percentage": 44.36, "elapsed_time": "3:29:49", "remaining_time": "4:23:09"}
|
| 783 |
+
{"current_steps": 540, "total_steps": 1215, "loss": 0.3293, "lr": 2.7220103344004995e-05, "epoch": 2.2199383350462485, "percentage": 44.44, "elapsed_time": "3:30:12", "remaining_time": "4:22:45"}
|
| 784 |
+
{"current_steps": 541, "total_steps": 1215, "loss": 0.3419, "lr": 2.7166464524185977e-05, "epoch": 2.224049331963001, "percentage": 44.53, "elapsed_time": "3:30:35", "remaining_time": "4:22:22"}
|
| 785 |
+
{"current_steps": 542, "total_steps": 1215, "loss": 0.3277, "lr": 2.7112766498590944e-05, "epoch": 2.2281603288797536, "percentage": 44.61, "elapsed_time": "3:30:58", "remaining_time": "4:21:58"}
|
| 786 |
+
{"current_steps": 543, "total_steps": 1215, "loss": 0.3352, "lr": 2.705900971084635e-05, "epoch": 2.2322713257965057, "percentage": 44.69, "elapsed_time": "3:31:21", "remaining_time": "4:21:34"}
|
| 787 |
+
{"current_steps": 544, "total_steps": 1215, "loss": 0.3334, "lr": 2.7005194605064122e-05, "epoch": 2.2363823227132578, "percentage": 44.77, "elapsed_time": "3:31:44", "remaining_time": "4:21:11"}
|