sedrickkeh commited on
Commit
63c22e9
·
verified ·
1 Parent(s): 77f6b00

Training in progress, epoch 4

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:016c8b67370f54adeea3971a528165bac109770d965c5eb8bd7caa292a2fc3c2
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d49ad30bcd6ad70aedc18fc8e27452edc708711851da4798b32cc418096753d
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9c8b29f21ad8da68d2bfa523ab246f3df6a8f72b241362b8cd77f672173a13e4
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cbef6f6bca0cc4b1f1b466aff2750ed5a791bf45b69f45c1abb2a0145ee319bf
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5327118af3f2d74b3bb57501805d9caf7b38d4828193637dd00cee3dbaf623f6
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7658a695fae6c7a1d9b86ff973691a21f23093721a9cec921cf205e7ef20210d
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8adae781a2fc2d988086caf80c135c8344f9ba21271ce2db5efcafae98c8c54
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25a2acb4040aaa99033ca6d314f3872941e3ed125e2a024f0ae133bb93983380
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -499,3 +499,128 @@
499
  {"current_steps": 499, "total_steps": 625, "loss": 0.4066, "lr": 9.518509952841586e-06, "epoch": 3.9860209685471792, "percentage": 79.84, "elapsed_time": "21:19:49", "remaining_time": "5:23:09"}
500
  {"current_steps": 500, "total_steps": 625, "loss": 0.4039, "lr": 9.374197950119726e-06, "epoch": 3.9940089865202197, "percentage": 80.0, "elapsed_time": "21:22:21", "remaining_time": "5:20:35"}
501
  {"current_steps": 501, "total_steps": 625, "loss": 0.7111, "lr": 9.230842950740002e-06, "epoch": 4.00199700449326, "percentage": 80.16, "elapsed_time": "21:26:30", "remaining_time": "5:18:25"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
499
  {"current_steps": 499, "total_steps": 625, "loss": 0.4066, "lr": 9.518509952841586e-06, "epoch": 3.9860209685471792, "percentage": 79.84, "elapsed_time": "21:19:49", "remaining_time": "5:23:09"}
500
  {"current_steps": 500, "total_steps": 625, "loss": 0.4039, "lr": 9.374197950119726e-06, "epoch": 3.9940089865202197, "percentage": 80.0, "elapsed_time": "21:22:21", "remaining_time": "5:20:35"}
501
  {"current_steps": 501, "total_steps": 625, "loss": 0.7111, "lr": 9.230842950740002e-06, "epoch": 4.00199700449326, "percentage": 80.16, "elapsed_time": "21:26:30", "remaining_time": "5:18:25"}
502
+ {"current_steps": 502, "total_steps": 625, "loss": 0.3809, "lr": 9.088449434298204e-06, "epoch": 4.0099850224663, "percentage": 80.32, "elapsed_time": "21:29:03", "remaining_time": "5:15:50"}
503
+ {"current_steps": 503, "total_steps": 625, "loss": 0.3726, "lr": 8.947021850345398e-06, "epoch": 4.017973040439341, "percentage": 80.48, "elapsed_time": "21:31:36", "remaining_time": "5:13:16"}
504
+ {"current_steps": 504, "total_steps": 625, "loss": 0.3808, "lr": 8.806564618248999e-06, "epoch": 4.025961058412381, "percentage": 80.64, "elapsed_time": "21:34:09", "remaining_time": "5:10:42"}
505
+ {"current_steps": 505, "total_steps": 625, "loss": 0.3832, "lr": 8.667082127054533e-06, "epoch": 4.033949076385422, "percentage": 80.8, "elapsed_time": "21:36:42", "remaining_time": "5:08:07"}
506
+ {"current_steps": 506, "total_steps": 625, "loss": 0.3779, "lr": 8.52857873534862e-06, "epoch": 4.041937094358462, "percentage": 80.96, "elapsed_time": "21:39:15", "remaining_time": "5:05:33"}
507
+ {"current_steps": 507, "total_steps": 625, "loss": 0.3831, "lr": 8.391058771122673e-06, "epoch": 4.049925112331502, "percentage": 81.12, "elapsed_time": "21:41:49", "remaining_time": "5:02:59"}
508
+ {"current_steps": 508, "total_steps": 625, "loss": 0.3874, "lr": 8.254526531637727e-06, "epoch": 4.057913130304543, "percentage": 81.28, "elapsed_time": "21:44:21", "remaining_time": "5:00:24"}
509
+ {"current_steps": 509, "total_steps": 625, "loss": 0.3873, "lr": 8.118986283290096e-06, "epoch": 4.065901148277583, "percentage": 81.44, "elapsed_time": "21:46:54", "remaining_time": "4:57:50"}
510
+ {"current_steps": 510, "total_steps": 625, "loss": 0.3779, "lr": 7.984442261478108e-06, "epoch": 4.073889166250624, "percentage": 81.6, "elapsed_time": "21:49:28", "remaining_time": "4:55:16"}
511
+ {"current_steps": 511, "total_steps": 625, "loss": 0.3796, "lr": 7.850898670469745e-06, "epoch": 4.081877184223664, "percentage": 81.76, "elapsed_time": "21:52:01", "remaining_time": "4:52:42"}
512
+ {"current_steps": 512, "total_steps": 625, "loss": 0.3801, "lr": 7.718359683271224e-06, "epoch": 4.089865202196705, "percentage": 81.92, "elapsed_time": "21:54:34", "remaining_time": "4:50:07"}
513
+ {"current_steps": 513, "total_steps": 625, "loss": 0.3692, "lr": 7.586829441496668e-06, "epoch": 4.097853220169745, "percentage": 82.08, "elapsed_time": "21:57:07", "remaining_time": "4:47:33"}
514
+ {"current_steps": 514, "total_steps": 625, "loss": 0.3792, "lr": 7.456312055238606e-06, "epoch": 4.105841238142786, "percentage": 82.24, "elapsed_time": "21:59:40", "remaining_time": "4:44:59"}
515
+ {"current_steps": 515, "total_steps": 625, "loss": 0.3825, "lr": 7.326811602939634e-06, "epoch": 4.113829256115826, "percentage": 82.4, "elapsed_time": "22:02:13", "remaining_time": "4:42:24"}
516
+ {"current_steps": 516, "total_steps": 625, "loss": 0.3827, "lr": 7.198332131264876e-06, "epoch": 4.121817274088866, "percentage": 82.56, "elapsed_time": "22:04:45", "remaining_time": "4:39:50"}
517
+ {"current_steps": 517, "total_steps": 625, "loss": 0.3858, "lr": 7.070877654975614e-06, "epoch": 4.129805292061907, "percentage": 82.72, "elapsed_time": "22:07:17", "remaining_time": "4:37:16"}
518
+ {"current_steps": 518, "total_steps": 625, "loss": 0.3763, "lr": 6.944452156803763e-06, "epoch": 4.137793310034947, "percentage": 82.88, "elapsed_time": "22:09:50", "remaining_time": "4:34:41"}
519
+ {"current_steps": 519, "total_steps": 625, "loss": 0.3798, "lr": 6.819059587327479e-06, "epoch": 4.145781328007988, "percentage": 83.04, "elapsed_time": "22:12:25", "remaining_time": "4:32:07"}
520
+ {"current_steps": 520, "total_steps": 625, "loss": 0.3812, "lr": 6.694703864847673e-06, "epoch": 4.153769345981028, "percentage": 83.2, "elapsed_time": "22:14:59", "remaining_time": "4:29:33"}
521
+ {"current_steps": 521, "total_steps": 625, "loss": 0.3804, "lr": 6.571388875265592e-06, "epoch": 4.161757363954069, "percentage": 83.36, "elapsed_time": "22:17:35", "remaining_time": "4:27:00"}
522
+ {"current_steps": 522, "total_steps": 625, "loss": 0.3815, "lr": 6.449118471961342e-06, "epoch": 4.169745381927109, "percentage": 83.52, "elapsed_time": "22:20:09", "remaining_time": "4:24:26"}
523
+ {"current_steps": 523, "total_steps": 625, "loss": 0.3796, "lr": 6.327896475673561e-06, "epoch": 4.177733399900149, "percentage": 83.68, "elapsed_time": "22:22:42", "remaining_time": "4:21:52"}
524
+ {"current_steps": 524, "total_steps": 625, "loss": 0.3802, "lr": 6.207726674379961e-06, "epoch": 4.18572141787319, "percentage": 83.84, "elapsed_time": "22:25:15", "remaining_time": "4:19:17"}
525
+ {"current_steps": 525, "total_steps": 625, "loss": 0.3752, "lr": 6.088612823178968e-06, "epoch": 4.19370943584623, "percentage": 84.0, "elapsed_time": "22:27:47", "remaining_time": "4:16:43"}
526
+ {"current_steps": 526, "total_steps": 625, "loss": 0.3772, "lr": 5.970558644172424e-06, "epoch": 4.201697453819271, "percentage": 84.16, "elapsed_time": "22:30:20", "remaining_time": "4:14:09"}
527
+ {"current_steps": 527, "total_steps": 625, "loss": 0.3738, "lr": 5.853567826349213e-06, "epoch": 4.209685471792311, "percentage": 84.32, "elapsed_time": "22:32:53", "remaining_time": "4:11:34"}
528
+ {"current_steps": 528, "total_steps": 625, "loss": 0.3752, "lr": 5.737644025470057e-06, "epoch": 4.217673489765352, "percentage": 84.48, "elapsed_time": "22:35:25", "remaining_time": "4:09:00"}
529
+ {"current_steps": 529, "total_steps": 625, "loss": 0.3822, "lr": 5.6227908639532045e-06, "epoch": 4.225661507738392, "percentage": 84.64, "elapsed_time": "22:37:58", "remaining_time": "4:06:26"}
530
+ {"current_steps": 530, "total_steps": 625, "loss": 0.381, "lr": 5.509011930761308e-06, "epoch": 4.233649525711433, "percentage": 84.8, "elapsed_time": "22:40:31", "remaining_time": "4:03:52"}
531
+ {"current_steps": 531, "total_steps": 625, "loss": 0.3816, "lr": 5.396310781289243e-06, "epoch": 4.241637543684473, "percentage": 84.96, "elapsed_time": "22:43:04", "remaining_time": "4:01:17"}
532
+ {"current_steps": 532, "total_steps": 625, "loss": 0.3696, "lr": 5.284690937252977e-06, "epoch": 4.249625561657513, "percentage": 85.12, "elapsed_time": "22:45:37", "remaining_time": "3:58:43"}
533
+ {"current_steps": 533, "total_steps": 625, "loss": 0.3859, "lr": 5.1741558865795906e-06, "epoch": 4.257613579630554, "percentage": 85.28, "elapsed_time": "22:48:10", "remaining_time": "3:56:09"}
534
+ {"current_steps": 534, "total_steps": 625, "loss": 0.3822, "lr": 5.064709083298214e-06, "epoch": 4.265601597603594, "percentage": 85.44, "elapsed_time": "22:50:43", "remaining_time": "3:53:35"}
535
+ {"current_steps": 535, "total_steps": 625, "loss": 0.3782, "lr": 4.95635394743216e-06, "epoch": 4.273589615576635, "percentage": 85.6, "elapsed_time": "22:53:16", "remaining_time": "3:51:01"}
536
+ {"current_steps": 536, "total_steps": 625, "loss": 0.3822, "lr": 4.849093864891994e-06, "epoch": 4.281577633549675, "percentage": 85.76, "elapsed_time": "22:55:48", "remaining_time": "3:48:26"}
537
+ {"current_steps": 537, "total_steps": 625, "loss": 0.3783, "lr": 4.7429321873697865e-06, "epoch": 4.289565651522716, "percentage": 85.92, "elapsed_time": "22:58:21", "remaining_time": "3:45:52"}
538
+ {"current_steps": 538, "total_steps": 625, "loss": 0.3805, "lr": 4.637872232234326e-06, "epoch": 4.297553669495756, "percentage": 86.08, "elapsed_time": "23:00:55", "remaining_time": "3:43:18"}
539
+ {"current_steps": 539, "total_steps": 625, "loss": 0.3795, "lr": 4.5339172824274955e-06, "epoch": 4.305541687468796, "percentage": 86.24, "elapsed_time": "23:03:27", "remaining_time": "3:40:44"}
540
+ {"current_steps": 540, "total_steps": 625, "loss": 0.3794, "lr": 4.4310705863616835e-06, "epoch": 4.313529705441837, "percentage": 86.4, "elapsed_time": "23:06:00", "remaining_time": "3:38:10"}
541
+ {"current_steps": 541, "total_steps": 625, "loss": 0.3759, "lr": 4.329335357818236e-06, "epoch": 4.321517723414877, "percentage": 86.56, "elapsed_time": "23:08:34", "remaining_time": "3:35:36"}
542
+ {"current_steps": 542, "total_steps": 625, "loss": 0.3877, "lr": 4.228714775847084e-06, "epoch": 4.329505741387918, "percentage": 86.72, "elapsed_time": "23:11:06", "remaining_time": "3:33:01"}
543
+ {"current_steps": 543, "total_steps": 625, "loss": 0.3803, "lr": 4.129211984667385e-06, "epoch": 4.337493759360958, "percentage": 86.88, "elapsed_time": "23:13:39", "remaining_time": "3:30:27"}
544
+ {"current_steps": 544, "total_steps": 625, "loss": 0.3764, "lr": 4.030830093569247e-06, "epoch": 4.345481777333999, "percentage": 87.04, "elapsed_time": "23:16:11", "remaining_time": "3:27:53"}
545
+ {"current_steps": 545, "total_steps": 625, "loss": 0.3818, "lr": 3.933572176816602e-06, "epoch": 4.353469795307039, "percentage": 87.2, "elapsed_time": "23:18:44", "remaining_time": "3:25:19"}
546
+ {"current_steps": 546, "total_steps": 625, "loss": 0.3749, "lr": 3.837441273551137e-06, "epoch": 4.361457813280079, "percentage": 87.36, "elapsed_time": "23:21:17", "remaining_time": "3:22:45"}
547
+ {"current_steps": 547, "total_steps": 625, "loss": 0.3741, "lr": 3.7424403876972924e-06, "epoch": 4.36944583125312, "percentage": 87.52, "elapsed_time": "23:23:50", "remaining_time": "3:20:10"}
548
+ {"current_steps": 548, "total_steps": 625, "loss": 0.3889, "lr": 3.6485724878684382e-06, "epoch": 4.37743384922616, "percentage": 87.68, "elapsed_time": "23:26:22", "remaining_time": "3:17:36"}
549
+ {"current_steps": 549, "total_steps": 625, "loss": 0.3788, "lr": 3.555840507274093e-06, "epoch": 4.385421867199201, "percentage": 87.84, "elapsed_time": "23:28:56", "remaining_time": "3:15:02"}
550
+ {"current_steps": 550, "total_steps": 625, "loss": 0.3833, "lr": 3.464247343628242e-06, "epoch": 4.393409885172241, "percentage": 88.0, "elapsed_time": "23:31:29", "remaining_time": "3:12:28"}
551
+ {"current_steps": 551, "total_steps": 625, "loss": 0.3756, "lr": 3.373795859058837e-06, "epoch": 4.401397903145282, "percentage": 88.16, "elapsed_time": "23:34:01", "remaining_time": "3:09:54"}
552
+ {"current_steps": 552, "total_steps": 625, "loss": 0.3809, "lr": 3.284488880018315e-06, "epoch": 4.409385921118322, "percentage": 88.32, "elapsed_time": "23:36:34", "remaining_time": "3:07:20"}
553
+ {"current_steps": 553, "total_steps": 625, "loss": 0.379, "lr": 3.196329197195307e-06, "epoch": 4.417373939091363, "percentage": 88.48, "elapsed_time": "23:39:07", "remaining_time": "3:04:46"}
554
+ {"current_steps": 554, "total_steps": 625, "loss": 0.3844, "lr": 3.1093195654274024e-06, "epoch": 4.425361957064403, "percentage": 88.64, "elapsed_time": "23:41:40", "remaining_time": "3:02:12"}
555
+ {"current_steps": 555, "total_steps": 625, "loss": 0.3754, "lr": 3.0234627036151186e-06, "epoch": 4.433349975037443, "percentage": 88.8, "elapsed_time": "23:44:13", "remaining_time": "2:59:37"}
556
+ {"current_steps": 556, "total_steps": 625, "loss": 0.3767, "lr": 2.9387612946368647e-06, "epoch": 4.441337993010484, "percentage": 88.96, "elapsed_time": "23:46:45", "remaining_time": "2:57:03"}
557
+ {"current_steps": 557, "total_steps": 625, "loss": 0.3818, "lr": 2.855217985265184e-06, "epoch": 4.449326010983524, "percentage": 89.12, "elapsed_time": "23:49:18", "remaining_time": "2:54:29"}
558
+ {"current_steps": 558, "total_steps": 625, "loss": 0.3789, "lr": 2.7728353860839763e-06, "epoch": 4.457314028956565, "percentage": 89.28, "elapsed_time": "23:51:51", "remaining_time": "2:51:55"}
559
+ {"current_steps": 559, "total_steps": 625, "loss": 0.3721, "lr": 2.6916160714069817e-06, "epoch": 4.465302046929605, "percentage": 89.44, "elapsed_time": "23:54:23", "remaining_time": "2:49:21"}
560
+ {"current_steps": 560, "total_steps": 625, "loss": 0.3777, "lr": 2.6115625791973155e-06, "epoch": 4.473290064902646, "percentage": 89.6, "elapsed_time": "23:56:56", "remaining_time": "2:46:47"}
561
+ {"current_steps": 561, "total_steps": 625, "loss": 0.3805, "lr": 2.5326774109881223e-06, "epoch": 4.481278082875686, "percentage": 89.76, "elapsed_time": "23:59:29", "remaining_time": "2:44:13"}
562
+ {"current_steps": 562, "total_steps": 625, "loss": 0.3746, "lr": 2.454963031804485e-06, "epoch": 4.489266100848727, "percentage": 89.92, "elapsed_time": "1 day, 0:02:02", "remaining_time": "2:41:39"}
563
+ {"current_steps": 563, "total_steps": 625, "loss": 0.3761, "lr": 2.378421870086314e-06, "epoch": 4.497254118821767, "percentage": 90.08, "elapsed_time": "1 day, 0:04:35", "remaining_time": "2:39:05"}
564
+ {"current_steps": 564, "total_steps": 625, "loss": 0.3738, "lr": 2.3030563176125444e-06, "epoch": 4.5052421367948075, "percentage": 90.24, "elapsed_time": "1 day, 0:07:08", "remaining_time": "2:36:31"}
565
+ {"current_steps": 565, "total_steps": 625, "loss": 0.3765, "lr": 2.228868729426319e-06, "epoch": 4.513230154767848, "percentage": 90.4, "elapsed_time": "1 day, 0:09:41", "remaining_time": "2:33:56"}
566
+ {"current_steps": 566, "total_steps": 625, "loss": 0.3778, "lr": 2.1558614237614516e-06, "epoch": 4.521218172740888, "percentage": 90.56, "elapsed_time": "1 day, 0:12:14", "remaining_time": "2:31:22"}
567
+ {"current_steps": 567, "total_steps": 625, "loss": 0.3857, "lr": 2.0840366819699788e-06, "epoch": 4.529206190713929, "percentage": 90.72, "elapsed_time": "1 day, 0:14:46", "remaining_time": "2:28:48"}
568
+ {"current_steps": 568, "total_steps": 625, "loss": 0.3761, "lr": 2.013396748450842e-06, "epoch": 4.537194208686969, "percentage": 90.88, "elapsed_time": "1 day, 0:17:20", "remaining_time": "2:26:14"}
569
+ {"current_steps": 569, "total_steps": 625, "loss": 0.3756, "lr": 1.9439438305797776e-06, "epoch": 4.54518222666001, "percentage": 91.04, "elapsed_time": "1 day, 0:19:54", "remaining_time": "2:23:40"}
570
+ {"current_steps": 570, "total_steps": 625, "loss": 0.3782, "lr": 1.8756800986403466e-06, "epoch": 4.55317024463305, "percentage": 91.2, "elapsed_time": "1 day, 0:22:29", "remaining_time": "2:21:07"}
571
+ {"current_steps": 571, "total_steps": 625, "loss": 0.3776, "lr": 1.808607685756103e-06, "epoch": 4.5611582626060905, "percentage": 91.36, "elapsed_time": "1 day, 0:25:02", "remaining_time": "2:18:32"}
572
+ {"current_steps": 572, "total_steps": 625, "loss": 0.3713, "lr": 1.7427286878239247e-06, "epoch": 4.569146280579131, "percentage": 91.52, "elapsed_time": "1 day, 0:27:38", "remaining_time": "2:15:59"}
573
+ {"current_steps": 573, "total_steps": 625, "loss": 0.3781, "lr": 1.6780451634485606e-06, "epoch": 4.5771342985521715, "percentage": 91.68, "elapsed_time": "1 day, 0:30:12", "remaining_time": "2:13:25"}
574
+ {"current_steps": 574, "total_steps": 625, "loss": 0.3822, "lr": 1.614559133878264e-06, "epoch": 4.585122316525212, "percentage": 91.84, "elapsed_time": "1 day, 0:32:47", "remaining_time": "2:10:51"}
575
+ {"current_steps": 575, "total_steps": 625, "loss": 0.3789, "lr": 1.5522725829416474e-06, "epoch": 4.5931103344982525, "percentage": 92.0, "elapsed_time": "1 day, 0:35:20", "remaining_time": "2:08:17"}
576
+ {"current_steps": 576, "total_steps": 625, "loss": 0.3777, "lr": 1.4911874569856965e-06, "epoch": 4.601098352471293, "percentage": 92.16, "elapsed_time": "1 day, 0:37:55", "remaining_time": "2:05:43"}
577
+ {"current_steps": 577, "total_steps": 625, "loss": 0.3818, "lr": 1.4313056648149393e-06, "epoch": 4.6090863704443334, "percentage": 92.32, "elapsed_time": "1 day, 0:40:29", "remaining_time": "2:03:09"}
578
+ {"current_steps": 578, "total_steps": 625, "loss": 0.3752, "lr": 1.3726290776318175e-06, "epoch": 4.6170743884173735, "percentage": 92.48, "elapsed_time": "1 day, 0:43:03", "remaining_time": "2:00:35"}
579
+ {"current_steps": 579, "total_steps": 625, "loss": 0.3846, "lr": 1.3151595289781738e-06, "epoch": 4.625062406390414, "percentage": 92.64, "elapsed_time": "1 day, 0:45:35", "remaining_time": "1:58:01"}
580
+ {"current_steps": 580, "total_steps": 625, "loss": 0.3884, "lr": 1.2588988146780135e-06, "epoch": 4.6330504243634545, "percentage": 92.8, "elapsed_time": "1 day, 0:48:09", "remaining_time": "1:55:27"}
581
+ {"current_steps": 581, "total_steps": 625, "loss": 0.3841, "lr": 1.2038486927813354e-06, "epoch": 4.641038442336495, "percentage": 92.96, "elapsed_time": "1 day, 0:50:42", "remaining_time": "1:52:53"}
582
+ {"current_steps": 582, "total_steps": 625, "loss": 0.3812, "lr": 1.1500108835092472e-06, "epoch": 4.6490264603095355, "percentage": 93.12, "elapsed_time": "1 day, 0:53:14", "remaining_time": "1:50:19"}
583
+ {"current_steps": 583, "total_steps": 625, "loss": 0.3792, "lr": 1.0973870692001554e-06, "epoch": 4.657014478282576, "percentage": 93.28, "elapsed_time": "1 day, 0:55:48", "remaining_time": "1:47:45"}
584
+ {"current_steps": 584, "total_steps": 625, "loss": 0.3843, "lr": 1.0459788942572423e-06, "epoch": 4.6650024962556165, "percentage": 93.44, "elapsed_time": "1 day, 0:58:21", "remaining_time": "1:45:11"}
585
+ {"current_steps": 585, "total_steps": 625, "loss": 0.3857, "lr": 9.957879650970549e-07, "epoch": 4.6729905142286565, "percentage": 93.6, "elapsed_time": "1 day, 1:00:54", "remaining_time": "1:42:37"}
586
+ {"current_steps": 586, "total_steps": 625, "loss": 0.3874, "lr": 9.468158500993207e-07, "epoch": 4.6809785322016975, "percentage": 93.76, "elapsed_time": "1 day, 1:03:26", "remaining_time": "1:40:03"}
587
+ {"current_steps": 587, "total_steps": 625, "loss": 0.3808, "lr": 8.990640795579186e-07, "epoch": 4.6889665501747375, "percentage": 93.92, "elapsed_time": "1 day, 1:05:59", "remaining_time": "1:37:29"}
588
+ {"current_steps": 588, "total_steps": 625, "loss": 0.3727, "lr": 8.525341456330883e-07, "epoch": 4.6969545681477785, "percentage": 94.08, "elapsed_time": "1 day, 1:08:32", "remaining_time": "1:34:55"}
589
+ {"current_steps": 589, "total_steps": 625, "loss": 0.3761, "lr": 8.072275023047926e-07, "epoch": 4.7049425861208185, "percentage": 94.24, "elapsed_time": "1 day, 1:11:05", "remaining_time": "1:32:21"}
590
+ {"current_steps": 590, "total_steps": 625, "loss": 0.3832, "lr": 7.631455653272613e-07, "epoch": 4.712930604093859, "percentage": 94.4, "elapsed_time": "1 day, 1:13:38", "remaining_time": "1:29:47"}
591
+ {"current_steps": 591, "total_steps": 625, "loss": 0.3749, "lr": 7.202897121847852e-07, "epoch": 4.7209186220668995, "percentage": 94.56, "elapsed_time": "1 day, 1:16:10", "remaining_time": "1:27:13"}
592
+ {"current_steps": 592, "total_steps": 625, "loss": 0.3742, "lr": 6.786612820486449e-07, "epoch": 4.72890664003994, "percentage": 94.72, "elapsed_time": "1 day, 1:18:43", "remaining_time": "1:24:39"}
593
+ {"current_steps": 593, "total_steps": 625, "loss": 0.383, "lr": 6.382615757352817e-07, "epoch": 4.7368946580129805, "percentage": 94.88, "elapsed_time": "1 day, 1:21:16", "remaining_time": "1:22:05"}
594
+ {"current_steps": 594, "total_steps": 625, "loss": 0.3802, "lr": 5.990918556656411e-07, "epoch": 4.744882675986021, "percentage": 95.04, "elapsed_time": "1 day, 1:23:51", "remaining_time": "1:19:31"}
595
+ {"current_steps": 595, "total_steps": 625, "loss": 0.3826, "lr": 5.611533458257245e-07, "epoch": 4.7528706939590615, "percentage": 95.2, "elapsed_time": "1 day, 1:26:25", "remaining_time": "1:16:57"}
596
+ {"current_steps": 596, "total_steps": 625, "loss": 0.375, "lr": 5.2444723172834e-07, "epoch": 4.7608587119321015, "percentage": 95.36, "elapsed_time": "1 day, 1:28:57", "remaining_time": "1:14:23"}
597
+ {"current_steps": 597, "total_steps": 625, "loss": 0.3841, "lr": 4.889746603760693e-07, "epoch": 4.7688467299051425, "percentage": 95.52, "elapsed_time": "1 day, 1:31:30", "remaining_time": "1:11:49"}
598
+ {"current_steps": 598, "total_steps": 625, "loss": 0.3753, "lr": 4.5473674022541213e-07, "epoch": 4.7768347478781825, "percentage": 95.68, "elapsed_time": "1 day, 1:34:03", "remaining_time": "1:09:15"}
599
+ {"current_steps": 599, "total_steps": 625, "loss": 0.3838, "lr": 4.2173454115214783e-07, "epoch": 4.7848227658512235, "percentage": 95.84, "elapsed_time": "1 day, 1:36:35", "remaining_time": "1:06:41"}
600
+ {"current_steps": 600, "total_steps": 625, "loss": 0.3765, "lr": 3.899690944179257e-07, "epoch": 4.7928107838242635, "percentage": 96.0, "elapsed_time": "1 day, 1:39:08", "remaining_time": "1:04:07"}
601
+ {"current_steps": 601, "total_steps": 625, "loss": 0.3834, "lr": 3.5944139263800694e-07, "epoch": 4.8007988017973044, "percentage": 96.16, "elapsed_time": "1 day, 1:41:41", "remaining_time": "1:01:33"}
602
+ {"current_steps": 602, "total_steps": 625, "loss": 0.3694, "lr": 3.3015238975026675e-07, "epoch": 4.8087868197703445, "percentage": 96.32, "elapsed_time": "1 day, 1:44:14", "remaining_time": "0:58:59"}
603
+ {"current_steps": 603, "total_steps": 625, "loss": 0.3783, "lr": 3.021030009853876e-07, "epoch": 4.8167748377433846, "percentage": 96.48, "elapsed_time": "1 day, 1:46:47", "remaining_time": "0:56:26"}
604
+ {"current_steps": 604, "total_steps": 625, "loss": 0.3773, "lr": 2.752941028382594e-07, "epoch": 4.8247628557164255, "percentage": 96.64, "elapsed_time": "1 day, 1:49:19", "remaining_time": "0:53:52"}
605
+ {"current_steps": 605, "total_steps": 625, "loss": 0.3777, "lr": 2.4972653304057073e-07, "epoch": 4.8327508736894655, "percentage": 96.8, "elapsed_time": "1 day, 1:51:54", "remaining_time": "0:51:18"}
606
+ {"current_steps": 606, "total_steps": 625, "loss": 0.3808, "lr": 2.25401090534656e-07, "epoch": 4.8407388916625065, "percentage": 96.96, "elapsed_time": "1 day, 1:54:26", "remaining_time": "0:48:44"}
607
+ {"current_steps": 607, "total_steps": 625, "loss": 0.3744, "lr": 2.0231853544852465e-07, "epoch": 4.8487269096355465, "percentage": 97.12, "elapsed_time": "1 day, 1:56:59", "remaining_time": "0:46:10"}
608
+ {"current_steps": 608, "total_steps": 625, "loss": 0.3825, "lr": 1.8047958907209339e-07, "epoch": 4.8567149276085875, "percentage": 97.28, "elapsed_time": "1 day, 1:59:32", "remaining_time": "0:43:36"}
609
+ {"current_steps": 609, "total_steps": 625, "loss": 0.3749, "lr": 1.5988493383466198e-07, "epoch": 4.8647029455816275, "percentage": 97.44, "elapsed_time": "1 day, 2:02:05", "remaining_time": "0:41:02"}
610
+ {"current_steps": 610, "total_steps": 625, "loss": 0.3748, "lr": 1.40535213283588e-07, "epoch": 4.872690963554668, "percentage": 97.6, "elapsed_time": "1 day, 2:04:38", "remaining_time": "0:38:28"}
611
+ {"current_steps": 611, "total_steps": 625, "loss": 0.3819, "lr": 1.2243103206417418e-07, "epoch": 4.8806789815277085, "percentage": 97.76, "elapsed_time": "1 day, 2:07:11", "remaining_time": "0:35:54"}
612
+ {"current_steps": 612, "total_steps": 625, "loss": 0.3827, "lr": 1.05572955900759e-07, "epoch": 4.888666999500749, "percentage": 97.92, "elapsed_time": "1 day, 2:09:43", "remaining_time": "0:33:20"}
613
+ {"current_steps": 613, "total_steps": 625, "loss": 0.3674, "lr": 8.996151157907306e-08, "epoch": 4.8966550174737895, "percentage": 98.08, "elapsed_time": "1 day, 2:12:16", "remaining_time": "0:30:46"}
614
+ {"current_steps": 614, "total_steps": 625, "loss": 0.3755, "lr": 7.559718692974116e-08, "epoch": 4.90464303544683, "percentage": 98.24, "elapsed_time": "1 day, 2:14:48", "remaining_time": "0:28:12"}
615
+ {"current_steps": 615, "total_steps": 625, "loss": 0.3848, "lr": 6.248043081307664e-08, "epoch": 4.9126310534198705, "percentage": 98.4, "elapsed_time": "1 day, 2:17:22", "remaining_time": "0:25:38"}
616
+ {"current_steps": 616, "total_steps": 625, "loss": 0.3754, "lr": 5.0611653105003824e-08, "epoch": 4.9206190713929105, "percentage": 98.56, "elapsed_time": "1 day, 2:19:55", "remaining_time": "0:23:05"}
617
+ {"current_steps": 617, "total_steps": 625, "loss": 0.384, "lr": 3.99912246843126e-08, "epoch": 4.928607089365951, "percentage": 98.72, "elapsed_time": "1 day, 2:22:29", "remaining_time": "0:20:31"}
618
+ {"current_steps": 618, "total_steps": 625, "loss": 0.3797, "lr": 3.061947742101001e-08, "epoch": 4.9365951073389915, "percentage": 98.88, "elapsed_time": "1 day, 2:25:01", "remaining_time": "0:17:57"}
619
+ {"current_steps": 619, "total_steps": 625, "loss": 0.378, "lr": 2.2496704165995142e-08, "epoch": 4.944583125312032, "percentage": 99.04, "elapsed_time": "1 day, 2:27:34", "remaining_time": "0:15:23"}
620
+ {"current_steps": 620, "total_steps": 625, "loss": 0.3804, "lr": 1.5623158741884247e-08, "epoch": 4.9525711432850725, "percentage": 99.2, "elapsed_time": "1 day, 2:30:07", "remaining_time": "0:12:49"}
621
+ {"current_steps": 621, "total_steps": 625, "loss": 0.3661, "lr": 9.999055935074887e-09, "epoch": 4.960559161258113, "percentage": 99.36, "elapsed_time": "1 day, 2:32:40", "remaining_time": "0:10:15"}
622
+ {"current_steps": 622, "total_steps": 625, "loss": 0.3829, "lr": 5.624571489053488e-09, "epoch": 4.9685471792311535, "percentage": 99.52, "elapsed_time": "1 day, 2:35:13", "remaining_time": "0:07:41"}
623
+ {"current_steps": 623, "total_steps": 625, "loss": 0.3842, "lr": 2.499842098901972e-09, "epoch": 4.976535197204194, "percentage": 99.68, "elapsed_time": "1 day, 2:37:47", "remaining_time": "0:05:07"}
624
+ {"current_steps": 624, "total_steps": 625, "loss": 0.3817, "lr": 6.249654069989674e-10, "epoch": 4.9845232151772345, "percentage": 99.84, "elapsed_time": "1 day, 2:40:21", "remaining_time": "0:02:33"}
625
+ {"current_steps": 625, "total_steps": 625, "loss": 0.377, "lr": 0.0, "epoch": 4.992511233150275, "percentage": 100.0, "elapsed_time": "1 day, 2:42:53", "remaining_time": "0:00:00"}
626
+ {"current_steps": 625, "total_steps": 625, "epoch": 4.992511233150275, "percentage": 100.0, "elapsed_time": "1 day, 2:44:25", "remaining_time": "0:00:00"}