neginr commited on
Commit
8da04ac
·
verified ·
1 Parent(s): da190e3

Training in progress, epoch 2

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dcf886e574cf3c5ade47e3fe90e19434060308f67a480561e0ef29823882b4ff
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:086e5d8f946950a9ec6b6f434afb4b1af96440c0d83f1ed98441fd3046c9803a
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1ef1d5ca3e51f84cdabcc380149fad591d28c4424d805d96da9e1755f9827f3
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:46a53000d9f0db356b3bf5110c401b4e493b1f0a76b2c3b328edd6d494b3f100
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d71a1be8d778fdc50e2d81f28e2ab32a3e4f8fd8431ecdf6589858899ef59c60
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96a46931a03fb493cf5057e4bcc8501c45d952f736814cc0f83def7de5cbf9ca
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3497f55ebcdf68b359acaf9e96bef066a06e171174ae1114e7f771376738f0db
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:40495a184f4fd841420323aff04d1aa4f7945d98b89a90451472fb8ac59bfe74
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -496,3 +496,248 @@
496
  {"current_steps": 496, "total_steps": 1230, "loss": 0.375, "lr": 2.980274210295326e-05, "epoch": 2.0151898734177216, "percentage": 40.33, "elapsed_time": "4:25:58", "remaining_time": "6:33:35"}
497
  {"current_steps": 497, "total_steps": 1230, "loss": 0.3918, "lr": 2.9753229259313578e-05, "epoch": 2.019240506329114, "percentage": 40.41, "elapsed_time": "4:26:25", "remaining_time": "6:32:56"}
498
  {"current_steps": 498, "total_steps": 1230, "loss": 0.3742, "lr": 2.9703637864506274e-05, "epoch": 2.023291139240506, "percentage": 40.49, "elapsed_time": "4:26:53", "remaining_time": "6:32:17"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
496
  {"current_steps": 496, "total_steps": 1230, "loss": 0.375, "lr": 2.980274210295326e-05, "epoch": 2.0151898734177216, "percentage": 40.33, "elapsed_time": "4:25:58", "remaining_time": "6:33:35"}
497
  {"current_steps": 497, "total_steps": 1230, "loss": 0.3918, "lr": 2.9753229259313578e-05, "epoch": 2.019240506329114, "percentage": 40.41, "elapsed_time": "4:26:25", "remaining_time": "6:32:56"}
498
  {"current_steps": 498, "total_steps": 1230, "loss": 0.3742, "lr": 2.9703637864506274e-05, "epoch": 2.023291139240506, "percentage": 40.49, "elapsed_time": "4:26:53", "remaining_time": "6:32:17"}
499
+ {"current_steps": 499, "total_steps": 1230, "loss": 0.3754, "lr": 2.965396831793362e-05, "epoch": 2.0273417721518987, "percentage": 40.57, "elapsed_time": "4:27:24", "remaining_time": "6:31:43"}
500
+ {"current_steps": 500, "total_steps": 1230, "loss": 0.3876, "lr": 2.9604221019627316e-05, "epoch": 2.031392405063291, "percentage": 40.65, "elapsed_time": "4:27:54", "remaining_time": "6:31:08"}
501
+ {"current_steps": 501, "total_steps": 1230, "loss": 0.3746, "lr": 2.955439637024526e-05, "epoch": 2.0354430379746837, "percentage": 40.73, "elapsed_time": "4:28:30", "remaining_time": "6:30:41"}
502
+ {"current_steps": 502, "total_steps": 1230, "loss": 0.4118, "lr": 2.9504494771068334e-05, "epoch": 2.039493670886076, "percentage": 40.81, "elapsed_time": "4:29:01", "remaining_time": "6:30:08"}
503
+ {"current_steps": 503, "total_steps": 1230, "loss": 0.3885, "lr": 2.9454516623997156e-05, "epoch": 2.0435443037974683, "percentage": 40.89, "elapsed_time": "4:29:34", "remaining_time": "6:29:37"}
504
+ {"current_steps": 504, "total_steps": 1230, "loss": 0.3613, "lr": 2.9404462331548847e-05, "epoch": 2.047594936708861, "percentage": 40.98, "elapsed_time": "4:30:06", "remaining_time": "6:29:04"}
505
+ {"current_steps": 505, "total_steps": 1230, "loss": 0.3652, "lr": 2.93543322968538e-05, "epoch": 2.0516455696202534, "percentage": 41.06, "elapsed_time": "4:30:36", "remaining_time": "6:28:29"}
506
+ {"current_steps": 506, "total_steps": 1230, "loss": 0.3671, "lr": 2.9304126923652428e-05, "epoch": 2.0556962025316454, "percentage": 41.14, "elapsed_time": "4:31:09", "remaining_time": "6:27:58"}
507
+ {"current_steps": 507, "total_steps": 1230, "loss": 0.3653, "lr": 2.9253846616291896e-05, "epoch": 2.059746835443038, "percentage": 41.22, "elapsed_time": "4:31:40", "remaining_time": "6:27:25"}
508
+ {"current_steps": 508, "total_steps": 1230, "loss": 0.3706, "lr": 2.9203491779722896e-05, "epoch": 2.0637974683544305, "percentage": 41.3, "elapsed_time": "4:32:14", "remaining_time": "6:26:55"}
509
+ {"current_steps": 509, "total_steps": 1230, "loss": 0.3598, "lr": 2.9153062819496357e-05, "epoch": 2.067848101265823, "percentage": 41.38, "elapsed_time": "4:32:45", "remaining_time": "6:26:22"}
510
+ {"current_steps": 510, "total_steps": 1230, "loss": 0.3653, "lr": 2.9102560141760178e-05, "epoch": 2.071898734177215, "percentage": 41.46, "elapsed_time": "4:33:15", "remaining_time": "6:25:46"}
511
+ {"current_steps": 511, "total_steps": 1230, "loss": 0.3729, "lr": 2.9051984153256004e-05, "epoch": 2.0759493670886076, "percentage": 41.54, "elapsed_time": "4:33:46", "remaining_time": "6:25:12"}
512
+ {"current_steps": 512, "total_steps": 1230, "loss": 0.3884, "lr": 2.900133526131588e-05, "epoch": 2.08, "percentage": 41.63, "elapsed_time": "4:34:17", "remaining_time": "6:24:39"}
513
+ {"current_steps": 513, "total_steps": 1230, "loss": 0.391, "lr": 2.8950613873859025e-05, "epoch": 2.0840506329113926, "percentage": 41.71, "elapsed_time": "4:34:49", "remaining_time": "6:24:06"}
514
+ {"current_steps": 514, "total_steps": 1230, "loss": 0.383, "lr": 2.8899820399388515e-05, "epoch": 2.0881012658227847, "percentage": 41.79, "elapsed_time": "4:35:26", "remaining_time": "6:23:41"}
515
+ {"current_steps": 515, "total_steps": 1230, "loss": 0.3808, "lr": 2.8848955246988012e-05, "epoch": 2.092151898734177, "percentage": 41.87, "elapsed_time": "4:35:55", "remaining_time": "6:23:04"}
516
+ {"current_steps": 516, "total_steps": 1230, "loss": 0.3948, "lr": 2.879801882631847e-05, "epoch": 2.0962025316455697, "percentage": 41.95, "elapsed_time": "4:36:27", "remaining_time": "6:22:32"}
517
+ {"current_steps": 517, "total_steps": 1230, "loss": 0.3607, "lr": 2.8747011547614808e-05, "epoch": 2.100253164556962, "percentage": 42.03, "elapsed_time": "4:37:07", "remaining_time": "6:22:10"}
518
+ {"current_steps": 518, "total_steps": 1230, "loss": 0.3735, "lr": 2.8695933821682635e-05, "epoch": 2.1043037974683543, "percentage": 42.11, "elapsed_time": "4:37:33", "remaining_time": "6:21:31"}
519
+ {"current_steps": 519, "total_steps": 1230, "loss": 0.3446, "lr": 2.864478605989494e-05, "epoch": 2.108354430379747, "percentage": 42.2, "elapsed_time": "4:38:03", "remaining_time": "6:20:54"}
520
+ {"current_steps": 520, "total_steps": 1230, "loss": 0.3767, "lr": 2.8593568674188765e-05, "epoch": 2.1124050632911393, "percentage": 42.28, "elapsed_time": "4:38:36", "remaining_time": "6:20:24"}
521
+ {"current_steps": 521, "total_steps": 1230, "loss": 0.345, "lr": 2.8542282077061892e-05, "epoch": 2.116455696202532, "percentage": 42.36, "elapsed_time": "4:39:05", "remaining_time": "6:19:47"}
522
+ {"current_steps": 522, "total_steps": 1230, "loss": 0.393, "lr": 2.8490926681569523e-05, "epoch": 2.120506329113924, "percentage": 42.44, "elapsed_time": "4:39:34", "remaining_time": "6:19:11"}
523
+ {"current_steps": 523, "total_steps": 1230, "loss": 0.3649, "lr": 2.8439502901320956e-05, "epoch": 2.1245569620253164, "percentage": 42.52, "elapsed_time": "4:40:07", "remaining_time": "6:18:40"}
524
+ {"current_steps": 524, "total_steps": 1230, "loss": 0.404, "lr": 2.8388011150476237e-05, "epoch": 2.128607594936709, "percentage": 42.6, "elapsed_time": "4:40:41", "remaining_time": "6:18:11"}
525
+ {"current_steps": 525, "total_steps": 1230, "loss": 0.3892, "lr": 2.8336451843742866e-05, "epoch": 2.1326582278481014, "percentage": 42.68, "elapsed_time": "4:41:16", "remaining_time": "6:17:42"}
526
+ {"current_steps": 526, "total_steps": 1230, "loss": 0.3633, "lr": 2.8284825396372387e-05, "epoch": 2.1367088607594935, "percentage": 42.76, "elapsed_time": "4:41:47", "remaining_time": "6:17:08"}
527
+ {"current_steps": 527, "total_steps": 1230, "loss": 0.3946, "lr": 2.8233132224157132e-05, "epoch": 2.140759493670886, "percentage": 42.85, "elapsed_time": "4:42:16", "remaining_time": "6:16:32"}
528
+ {"current_steps": 528, "total_steps": 1230, "loss": 0.393, "lr": 2.8181372743426805e-05, "epoch": 2.1448101265822785, "percentage": 42.93, "elapsed_time": "4:42:51", "remaining_time": "6:16:04"}
529
+ {"current_steps": 529, "total_steps": 1230, "loss": 0.402, "lr": 2.8129547371045128e-05, "epoch": 2.148860759493671, "percentage": 43.01, "elapsed_time": "4:43:19", "remaining_time": "6:15:26"}
530
+ {"current_steps": 530, "total_steps": 1230, "loss": 0.4123, "lr": 2.8077656524406534e-05, "epoch": 2.152911392405063, "percentage": 43.09, "elapsed_time": "4:43:50", "remaining_time": "6:14:53"}
531
+ {"current_steps": 531, "total_steps": 1230, "loss": 0.3916, "lr": 2.802570062143278e-05, "epoch": 2.1569620253164556, "percentage": 43.17, "elapsed_time": "4:44:23", "remaining_time": "6:14:21"}
532
+ {"current_steps": 532, "total_steps": 1230, "loss": 0.4087, "lr": 2.7973680080569555e-05, "epoch": 2.161012658227848, "percentage": 43.25, "elapsed_time": "4:44:54", "remaining_time": "6:13:48"}
533
+ {"current_steps": 533, "total_steps": 1230, "loss": 0.3777, "lr": 2.792159532078314e-05, "epoch": 2.1650632911392407, "percentage": 43.33, "elapsed_time": "4:45:23", "remaining_time": "6:13:12"}
534
+ {"current_steps": 534, "total_steps": 1230, "loss": 0.3634, "lr": 2.7869446761557033e-05, "epoch": 2.1691139240506327, "percentage": 43.41, "elapsed_time": "4:46:00", "remaining_time": "6:12:46"}
535
+ {"current_steps": 535, "total_steps": 1230, "loss": 0.402, "lr": 2.781723482288857e-05, "epoch": 2.1731645569620253, "percentage": 43.5, "elapsed_time": "4:46:32", "remaining_time": "6:12:13"}
536
+ {"current_steps": 536, "total_steps": 1230, "loss": 0.3529, "lr": 2.7764959925285517e-05, "epoch": 2.1772151898734178, "percentage": 43.58, "elapsed_time": "4:47:04", "remaining_time": "6:11:42"}
537
+ {"current_steps": 537, "total_steps": 1230, "loss": 0.3797, "lr": 2.771262248976272e-05, "epoch": 2.1812658227848103, "percentage": 43.66, "elapsed_time": "4:47:35", "remaining_time": "6:11:07"}
538
+ {"current_steps": 538, "total_steps": 1230, "loss": 0.3816, "lr": 2.7660222937838677e-05, "epoch": 2.1853164556962024, "percentage": 43.74, "elapsed_time": "4:48:00", "remaining_time": "6:10:27"}
539
+ {"current_steps": 539, "total_steps": 1230, "loss": 0.385, "lr": 2.7607761691532186e-05, "epoch": 2.189367088607595, "percentage": 43.82, "elapsed_time": "4:48:31", "remaining_time": "6:09:52"}
540
+ {"current_steps": 540, "total_steps": 1230, "loss": 0.3852, "lr": 2.7555239173358916e-05, "epoch": 2.1934177215189874, "percentage": 43.9, "elapsed_time": "4:49:01", "remaining_time": "6:09:18"}
541
+ {"current_steps": 541, "total_steps": 1230, "loss": 0.3666, "lr": 2.7502655806328e-05, "epoch": 2.19746835443038, "percentage": 43.98, "elapsed_time": "4:49:30", "remaining_time": "6:08:42"}
542
+ {"current_steps": 542, "total_steps": 1230, "loss": 0.3725, "lr": 2.7450012013938648e-05, "epoch": 2.201518987341772, "percentage": 44.07, "elapsed_time": "4:50:00", "remaining_time": "6:08:07"}
543
+ {"current_steps": 543, "total_steps": 1230, "loss": 0.3994, "lr": 2.739730822017673e-05, "epoch": 2.2055696202531645, "percentage": 44.15, "elapsed_time": "4:50:28", "remaining_time": "6:07:30"}
544
+ {"current_steps": 544, "total_steps": 1230, "loss": 0.3934, "lr": 2.7344544849511355e-05, "epoch": 2.209620253164557, "percentage": 44.23, "elapsed_time": "4:51:10", "remaining_time": "6:07:10"}
545
+ {"current_steps": 545, "total_steps": 1230, "loss": 0.394, "lr": 2.7291722326891456e-05, "epoch": 2.2136708860759495, "percentage": 44.31, "elapsed_time": "4:51:41", "remaining_time": "6:06:37"}
546
+ {"current_steps": 546, "total_steps": 1230, "loss": 0.3661, "lr": 2.723884107774236e-05, "epoch": 2.2177215189873416, "percentage": 44.39, "elapsed_time": "4:52:11", "remaining_time": "6:06:03"}
547
+ {"current_steps": 547, "total_steps": 1230, "loss": 0.3785, "lr": 2.718590152796239e-05, "epoch": 2.221772151898734, "percentage": 44.47, "elapsed_time": "4:52:48", "remaining_time": "6:05:36"}
548
+ {"current_steps": 548, "total_steps": 1230, "loss": 0.3811, "lr": 2.71329041039194e-05, "epoch": 2.2258227848101266, "percentage": 44.55, "elapsed_time": "4:53:22", "remaining_time": "6:05:06"}
549
+ {"current_steps": 549, "total_steps": 1230, "loss": 0.3889, "lr": 2.7079849232447357e-05, "epoch": 2.229873417721519, "percentage": 44.63, "elapsed_time": "4:53:58", "remaining_time": "6:04:39"}
550
+ {"current_steps": 550, "total_steps": 1230, "loss": 0.3943, "lr": 2.7026737340842895e-05, "epoch": 2.233924050632911, "percentage": 44.72, "elapsed_time": "4:54:32", "remaining_time": "6:04:10"}
551
+ {"current_steps": 551, "total_steps": 1230, "loss": 0.3801, "lr": 2.697356885686189e-05, "epoch": 2.2379746835443037, "percentage": 44.8, "elapsed_time": "4:55:03", "remaining_time": "6:03:36"}
552
+ {"current_steps": 552, "total_steps": 1230, "loss": 0.3801, "lr": 2.6920344208716014e-05, "epoch": 2.2420253164556962, "percentage": 44.88, "elapsed_time": "4:55:38", "remaining_time": "6:03:08"}
553
+ {"current_steps": 553, "total_steps": 1230, "loss": 0.3678, "lr": 2.6867063825069252e-05, "epoch": 2.2460759493670888, "percentage": 44.96, "elapsed_time": "4:56:09", "remaining_time": "6:02:34"}
554
+ {"current_steps": 554, "total_steps": 1230, "loss": 0.3823, "lr": 2.6813728135034494e-05, "epoch": 2.250126582278481, "percentage": 45.04, "elapsed_time": "4:56:40", "remaining_time": "6:02:00"}
555
+ {"current_steps": 555, "total_steps": 1230, "loss": 0.3998, "lr": 2.6760337568170056e-05, "epoch": 2.2541772151898734, "percentage": 45.12, "elapsed_time": "4:57:09", "remaining_time": "6:01:24"}
556
+ {"current_steps": 556, "total_steps": 1230, "loss": 0.3578, "lr": 2.6706892554476226e-05, "epoch": 2.258227848101266, "percentage": 45.2, "elapsed_time": "4:57:42", "remaining_time": "6:00:53"}
557
+ {"current_steps": 557, "total_steps": 1230, "loss": 0.39, "lr": 2.6653393524391795e-05, "epoch": 2.2622784810126584, "percentage": 45.28, "elapsed_time": "4:58:17", "remaining_time": "6:00:25"}
558
+ {"current_steps": 558, "total_steps": 1230, "loss": 0.3805, "lr": 2.6599840908790592e-05, "epoch": 2.2663291139240505, "percentage": 45.37, "elapsed_time": "4:58:53", "remaining_time": "5:59:57"}
559
+ {"current_steps": 559, "total_steps": 1230, "loss": 0.3816, "lr": 2.6546235138978028e-05, "epoch": 2.270379746835443, "percentage": 45.45, "elapsed_time": "4:59:22", "remaining_time": "5:59:21"}
560
+ {"current_steps": 560, "total_steps": 1230, "loss": 0.3709, "lr": 2.6492576646687597e-05, "epoch": 2.2744303797468355, "percentage": 45.53, "elapsed_time": "4:59:49", "remaining_time": "5:58:43"}
561
+ {"current_steps": 561, "total_steps": 1230, "loss": 0.3961, "lr": 2.6438865864077425e-05, "epoch": 2.278481012658228, "percentage": 45.61, "elapsed_time": "5:00:19", "remaining_time": "5:58:08"}
562
+ {"current_steps": 562, "total_steps": 1230, "loss": 0.376, "lr": 2.6385103223726766e-05, "epoch": 2.28253164556962, "percentage": 45.69, "elapsed_time": "5:00:57", "remaining_time": "5:57:42"}
563
+ {"current_steps": 563, "total_steps": 1230, "loss": 0.369, "lr": 2.6331289158632537e-05, "epoch": 2.2865822784810126, "percentage": 45.77, "elapsed_time": "5:01:28", "remaining_time": "5:57:09"}
564
+ {"current_steps": 564, "total_steps": 1230, "loss": 0.4034, "lr": 2.6277424102205817e-05, "epoch": 2.290632911392405, "percentage": 45.85, "elapsed_time": "5:02:02", "remaining_time": "5:56:39"}
565
+ {"current_steps": 565, "total_steps": 1230, "loss": 0.3951, "lr": 2.6223508488268374e-05, "epoch": 2.2946835443037976, "percentage": 45.93, "elapsed_time": "5:02:35", "remaining_time": "5:56:08"}
566
+ {"current_steps": 566, "total_steps": 1230, "loss": 0.3944, "lr": 2.6169542751049148e-05, "epoch": 2.2987341772151897, "percentage": 46.02, "elapsed_time": "5:03:03", "remaining_time": "5:55:32"}
567
+ {"current_steps": 567, "total_steps": 1230, "loss": 0.3961, "lr": 2.6115527325180754e-05, "epoch": 2.302784810126582, "percentage": 46.1, "elapsed_time": "5:03:40", "remaining_time": "5:55:05"}
568
+ {"current_steps": 568, "total_steps": 1230, "loss": 0.3815, "lr": 2.606146264569603e-05, "epoch": 2.3068354430379747, "percentage": 46.18, "elapsed_time": "5:04:10", "remaining_time": "5:54:30"}
569
+ {"current_steps": 569, "total_steps": 1230, "loss": 0.3677, "lr": 2.6007349148024447e-05, "epoch": 2.3108860759493672, "percentage": 46.26, "elapsed_time": "5:04:37", "remaining_time": "5:53:52"}
570
+ {"current_steps": 570, "total_steps": 1230, "loss": 0.3755, "lr": 2.5953187267988694e-05, "epoch": 2.3149367088607593, "percentage": 46.34, "elapsed_time": "5:05:10", "remaining_time": "5:53:21"}
571
+ {"current_steps": 571, "total_steps": 1230, "loss": 0.3932, "lr": 2.5898977441801097e-05, "epoch": 2.318987341772152, "percentage": 46.42, "elapsed_time": "5:05:40", "remaining_time": "5:52:47"}
572
+ {"current_steps": 572, "total_steps": 1230, "loss": 0.3802, "lr": 2.584472010606015e-05, "epoch": 2.3230379746835443, "percentage": 46.5, "elapsed_time": "5:06:11", "remaining_time": "5:52:13"}
573
+ {"current_steps": 573, "total_steps": 1230, "loss": 0.3786, "lr": 2.5790415697746976e-05, "epoch": 2.327088607594937, "percentage": 46.59, "elapsed_time": "5:06:45", "remaining_time": "5:51:44"}
574
+ {"current_steps": 574, "total_steps": 1230, "loss": 0.3756, "lr": 2.5736064654221808e-05, "epoch": 2.331139240506329, "percentage": 46.67, "elapsed_time": "5:07:20", "remaining_time": "5:51:15"}
575
+ {"current_steps": 575, "total_steps": 1230, "loss": 0.3893, "lr": 2.568166741322048e-05, "epoch": 2.3351898734177214, "percentage": 46.75, "elapsed_time": "5:07:55", "remaining_time": "5:50:46"}
576
+ {"current_steps": 576, "total_steps": 1230, "loss": 0.4123, "lr": 2.56272244128509e-05, "epoch": 2.339240506329114, "percentage": 46.83, "elapsed_time": "5:08:34", "remaining_time": "5:50:21"}
577
+ {"current_steps": 577, "total_steps": 1230, "loss": 0.3742, "lr": 2.55727360915895e-05, "epoch": 2.3432911392405065, "percentage": 46.91, "elapsed_time": "5:09:04", "remaining_time": "5:49:47"}
578
+ {"current_steps": 578, "total_steps": 1230, "loss": 0.3823, "lr": 2.5518202888277734e-05, "epoch": 2.3473417721518985, "percentage": 46.99, "elapsed_time": "5:09:30", "remaining_time": "5:49:07"}
579
+ {"current_steps": 579, "total_steps": 1230, "loss": 0.3938, "lr": 2.5463625242118523e-05, "epoch": 2.351392405063291, "percentage": 47.07, "elapsed_time": "5:10:06", "remaining_time": "5:48:40"}
580
+ {"current_steps": 580, "total_steps": 1230, "loss": 0.3902, "lr": 2.5409003592672723e-05, "epoch": 2.3554430379746836, "percentage": 47.15, "elapsed_time": "5:10:41", "remaining_time": "5:48:11"}
581
+ {"current_steps": 581, "total_steps": 1230, "loss": 0.3695, "lr": 2.535433837985559e-05, "epoch": 2.359493670886076, "percentage": 47.24, "elapsed_time": "5:11:08", "remaining_time": "5:47:33"}
582
+ {"current_steps": 582, "total_steps": 1230, "loss": 0.4116, "lr": 2.529963004393324e-05, "epoch": 2.363544303797468, "percentage": 47.32, "elapsed_time": "5:11:39", "remaining_time": "5:46:59"}
583
+ {"current_steps": 583, "total_steps": 1230, "loss": 0.3852, "lr": 2.524487902551908e-05, "epoch": 2.3675949367088607, "percentage": 47.4, "elapsed_time": "5:12:11", "remaining_time": "5:46:27"}
584
+ {"current_steps": 584, "total_steps": 1230, "loss": 0.3975, "lr": 2.519008576557029e-05, "epoch": 2.371645569620253, "percentage": 47.48, "elapsed_time": "5:12:43", "remaining_time": "5:45:54"}
585
+ {"current_steps": 585, "total_steps": 1230, "loss": 0.3857, "lr": 2.5135250705384254e-05, "epoch": 2.3756962025316457, "percentage": 47.56, "elapsed_time": "5:13:13", "remaining_time": "5:45:20"}
586
+ {"current_steps": 586, "total_steps": 1230, "loss": 0.3527, "lr": 2.5080374286595007e-05, "epoch": 2.379746835443038, "percentage": 47.64, "elapsed_time": "5:13:50", "remaining_time": "5:44:53"}
587
+ {"current_steps": 587, "total_steps": 1230, "loss": 0.3991, "lr": 2.5025456951169677e-05, "epoch": 2.3837974683544303, "percentage": 47.72, "elapsed_time": "5:14:18", "remaining_time": "5:44:18"}
588
+ {"current_steps": 588, "total_steps": 1230, "loss": 0.4076, "lr": 2.4970499141404942e-05, "epoch": 2.387848101265823, "percentage": 47.8, "elapsed_time": "5:14:54", "remaining_time": "5:43:50"}
589
+ {"current_steps": 589, "total_steps": 1230, "loss": 0.3793, "lr": 2.491550129992345e-05, "epoch": 2.3918987341772153, "percentage": 47.89, "elapsed_time": "5:15:21", "remaining_time": "5:43:12"}
590
+ {"current_steps": 590, "total_steps": 1230, "loss": 0.3915, "lr": 2.486046386967024e-05, "epoch": 2.3959493670886074, "percentage": 47.97, "elapsed_time": "5:15:48", "remaining_time": "5:42:34"}
591
+ {"current_steps": 591, "total_steps": 1230, "loss": 0.3762, "lr": 2.4805387293909214e-05, "epoch": 2.4, "percentage": 48.05, "elapsed_time": "5:16:19", "remaining_time": "5:42:01"}
592
+ {"current_steps": 592, "total_steps": 1230, "loss": 0.3653, "lr": 2.4750272016219552e-05, "epoch": 2.4040506329113924, "percentage": 48.13, "elapsed_time": "5:16:48", "remaining_time": "5:41:25"}
593
+ {"current_steps": 593, "total_steps": 1230, "loss": 0.3942, "lr": 2.4695118480492114e-05, "epoch": 2.408101265822785, "percentage": 48.21, "elapsed_time": "5:17:22", "remaining_time": "5:40:55"}
594
+ {"current_steps": 594, "total_steps": 1230, "loss": 0.3953, "lr": 2.4639927130925898e-05, "epoch": 2.4121518987341775, "percentage": 48.29, "elapsed_time": "5:17:55", "remaining_time": "5:40:24"}
595
+ {"current_steps": 595, "total_steps": 1230, "loss": 0.4026, "lr": 2.458469841202444e-05, "epoch": 2.4162025316455695, "percentage": 48.37, "elapsed_time": "5:18:29", "remaining_time": "5:39:54"}
596
+ {"current_steps": 596, "total_steps": 1230, "loss": 0.3804, "lr": 2.452943276859226e-05, "epoch": 2.420253164556962, "percentage": 48.46, "elapsed_time": "5:19:02", "remaining_time": "5:39:23"}
597
+ {"current_steps": 597, "total_steps": 1230, "loss": 0.3818, "lr": 2.447413064573125e-05, "epoch": 2.4243037974683546, "percentage": 48.54, "elapsed_time": "5:19:33", "remaining_time": "5:38:49"}
598
+ {"current_steps": 598, "total_steps": 1230, "loss": 0.3784, "lr": 2.4418792488837095e-05, "epoch": 2.4283544303797466, "percentage": 48.62, "elapsed_time": "5:20:04", "remaining_time": "5:38:16"}
599
+ {"current_steps": 599, "total_steps": 1230, "loss": 0.3923, "lr": 2.4363418743595713e-05, "epoch": 2.432405063291139, "percentage": 48.7, "elapsed_time": "5:20:39", "remaining_time": "5:37:47"}
600
+ {"current_steps": 600, "total_steps": 1230, "loss": 0.3961, "lr": 2.430800985597963e-05, "epoch": 2.4364556962025317, "percentage": 48.78, "elapsed_time": "5:21:16", "remaining_time": "5:37:20"}
601
+ {"current_steps": 601, "total_steps": 1230, "loss": 0.378, "lr": 2.4252566272244415e-05, "epoch": 2.440506329113924, "percentage": 48.86, "elapsed_time": "5:21:44", "remaining_time": "5:36:44"}
602
+ {"current_steps": 602, "total_steps": 1230, "loss": 0.3781, "lr": 2.4197088438925063e-05, "epoch": 2.4445569620253167, "percentage": 48.94, "elapsed_time": "5:22:19", "remaining_time": "5:36:14"}
603
+ {"current_steps": 603, "total_steps": 1230, "loss": 0.3907, "lr": 2.4141576802832417e-05, "epoch": 2.4486075949367088, "percentage": 49.02, "elapsed_time": "5:22:51", "remaining_time": "5:35:42"}
604
+ {"current_steps": 604, "total_steps": 1230, "loss": 0.3871, "lr": 2.408603181104957e-05, "epoch": 2.4526582278481013, "percentage": 49.11, "elapsed_time": "5:23:20", "remaining_time": "5:35:06"}
605
+ {"current_steps": 605, "total_steps": 1230, "loss": 0.3922, "lr": 2.4030453910928245e-05, "epoch": 2.456708860759494, "percentage": 49.19, "elapsed_time": "5:23:53", "remaining_time": "5:34:35"}
606
+ {"current_steps": 606, "total_steps": 1230, "loss": 0.3797, "lr": 2.397484355008521e-05, "epoch": 2.460759493670886, "percentage": 49.27, "elapsed_time": "5:24:27", "remaining_time": "5:34:05"}
607
+ {"current_steps": 607, "total_steps": 1230, "loss": 0.3823, "lr": 2.3919201176398662e-05, "epoch": 2.4648101265822784, "percentage": 49.35, "elapsed_time": "5:25:02", "remaining_time": "5:33:36"}
608
+ {"current_steps": 608, "total_steps": 1230, "loss": 0.3601, "lr": 2.3863527238004633e-05, "epoch": 2.468860759493671, "percentage": 49.43, "elapsed_time": "5:25:31", "remaining_time": "5:33:01"}
609
+ {"current_steps": 609, "total_steps": 1230, "loss": 0.3877, "lr": 2.380782218329337e-05, "epoch": 2.4729113924050634, "percentage": 49.51, "elapsed_time": "5:26:01", "remaining_time": "5:32:26"}
610
+ {"current_steps": 610, "total_steps": 1230, "loss": 0.3858, "lr": 2.3752086460905725e-05, "epoch": 2.476962025316456, "percentage": 49.59, "elapsed_time": "5:26:34", "remaining_time": "5:31:55"}
611
+ {"current_steps": 611, "total_steps": 1230, "loss": 0.375, "lr": 2.3696320519729544e-05, "epoch": 2.481012658227848, "percentage": 49.67, "elapsed_time": "5:27:09", "remaining_time": "5:31:26"}
612
+ {"current_steps": 612, "total_steps": 1230, "loss": 0.3574, "lr": 2.3640524808896045e-05, "epoch": 2.4850632911392405, "percentage": 49.76, "elapsed_time": "5:27:39", "remaining_time": "5:30:52"}
613
+ {"current_steps": 613, "total_steps": 1230, "loss": 0.3915, "lr": 2.3584699777776222e-05, "epoch": 2.489113924050633, "percentage": 49.84, "elapsed_time": "5:28:11", "remaining_time": "5:30:19"}
614
+ {"current_steps": 614, "total_steps": 1230, "loss": 0.3974, "lr": 2.3528845875977195e-05, "epoch": 2.493164556962025, "percentage": 49.92, "elapsed_time": "5:28:44", "remaining_time": "5:29:48"}
615
+ {"current_steps": 615, "total_steps": 1230, "loss": 0.3921, "lr": 2.3472963553338614e-05, "epoch": 2.4972151898734176, "percentage": 50.0, "elapsed_time": "5:29:13", "remaining_time": "5:29:13"}
616
+ {"current_steps": 616, "total_steps": 1230, "loss": 0.3796, "lr": 2.341705325992901e-05, "epoch": 2.50126582278481, "percentage": 50.08, "elapsed_time": "5:29:44", "remaining_time": "5:28:40"}
617
+ {"current_steps": 617, "total_steps": 1230, "loss": 0.3963, "lr": 2.336111544604222e-05, "epoch": 2.5053164556962026, "percentage": 50.16, "elapsed_time": "5:30:15", "remaining_time": "5:28:06"}
618
+ {"current_steps": 618, "total_steps": 1230, "loss": 0.4117, "lr": 2.33051505621937e-05, "epoch": 2.509367088607595, "percentage": 50.24, "elapsed_time": "5:30:43", "remaining_time": "5:27:30"}
619
+ {"current_steps": 619, "total_steps": 1230, "loss": 0.3783, "lr": 2.324915905911693e-05, "epoch": 2.5134177215189872, "percentage": 50.33, "elapsed_time": "5:31:14", "remaining_time": "5:26:57"}
620
+ {"current_steps": 620, "total_steps": 1230, "loss": 0.3933, "lr": 2.319314138775977e-05, "epoch": 2.5174683544303798, "percentage": 50.41, "elapsed_time": "5:31:46", "remaining_time": "5:26:25"}
621
+ {"current_steps": 621, "total_steps": 1230, "loss": 0.3985, "lr": 2.3137097999280856e-05, "epoch": 2.5215189873417723, "percentage": 50.49, "elapsed_time": "5:32:20", "remaining_time": "5:25:55"}
622
+ {"current_steps": 622, "total_steps": 1230, "loss": 0.3726, "lr": 2.308102934504593e-05, "epoch": 2.5255696202531643, "percentage": 50.57, "elapsed_time": "5:32:50", "remaining_time": "5:25:20"}
623
+ {"current_steps": 623, "total_steps": 1230, "loss": 0.3937, "lr": 2.3024935876624222e-05, "epoch": 2.529620253164557, "percentage": 50.65, "elapsed_time": "5:33:16", "remaining_time": "5:24:43"}
624
+ {"current_steps": 624, "total_steps": 1230, "loss": 0.3895, "lr": 2.2968818045784813e-05, "epoch": 2.5336708860759494, "percentage": 50.73, "elapsed_time": "5:33:44", "remaining_time": "5:24:07"}
625
+ {"current_steps": 625, "total_steps": 1230, "loss": 0.3964, "lr": 2.2912676304493006e-05, "epoch": 2.537721518987342, "percentage": 50.81, "elapsed_time": "5:34:19", "remaining_time": "5:23:37"}
626
+ {"current_steps": 626, "total_steps": 1230, "loss": 0.3825, "lr": 2.2856511104906668e-05, "epoch": 2.5417721518987344, "percentage": 50.89, "elapsed_time": "5:34:49", "remaining_time": "5:23:03"}
627
+ {"current_steps": 627, "total_steps": 1230, "loss": 0.3884, "lr": 2.2800322899372586e-05, "epoch": 2.5458227848101265, "percentage": 50.98, "elapsed_time": "5:35:20", "remaining_time": "5:22:30"}
628
+ {"current_steps": 628, "total_steps": 1230, "loss": 0.3779, "lr": 2.2744112140422844e-05, "epoch": 2.549873417721519, "percentage": 51.06, "elapsed_time": "5:35:51", "remaining_time": "5:21:57"}
629
+ {"current_steps": 629, "total_steps": 1230, "loss": 0.3953, "lr": 2.2687879280771177e-05, "epoch": 2.5539240506329115, "percentage": 51.14, "elapsed_time": "5:36:23", "remaining_time": "5:21:25"}
630
+ {"current_steps": 630, "total_steps": 1230, "loss": 0.3718, "lr": 2.26316247733093e-05, "epoch": 2.5579746835443036, "percentage": 51.22, "elapsed_time": "5:37:01", "remaining_time": "5:20:58"}
631
+ {"current_steps": 631, "total_steps": 1230, "loss": 0.4081, "lr": 2.257534907110328e-05, "epoch": 2.562025316455696, "percentage": 51.3, "elapsed_time": "5:37:36", "remaining_time": "5:20:28"}
632
+ {"current_steps": 632, "total_steps": 1230, "loss": 0.3901, "lr": 2.2519052627389882e-05, "epoch": 2.5660759493670886, "percentage": 51.38, "elapsed_time": "5:38:11", "remaining_time": "5:19:59"}
633
+ {"current_steps": 633, "total_steps": 1230, "loss": 0.3792, "lr": 2.246273589557294e-05, "epoch": 2.570126582278481, "percentage": 51.46, "elapsed_time": "5:38:40", "remaining_time": "5:19:25"}
634
+ {"current_steps": 634, "total_steps": 1230, "loss": 0.4045, "lr": 2.240639932921966e-05, "epoch": 2.5741772151898736, "percentage": 51.54, "elapsed_time": "5:39:19", "remaining_time": "5:18:59"}
635
+ {"current_steps": 635, "total_steps": 1230, "loss": 0.3751, "lr": 2.2350043382056995e-05, "epoch": 2.5782278481012657, "percentage": 51.63, "elapsed_time": "5:39:48", "remaining_time": "5:18:24"}
636
+ {"current_steps": 636, "total_steps": 1230, "loss": 0.384, "lr": 2.2293668507968015e-05, "epoch": 2.5822784810126582, "percentage": 51.71, "elapsed_time": "5:40:19", "remaining_time": "5:17:50"}
637
+ {"current_steps": 637, "total_steps": 1230, "loss": 0.3885, "lr": 2.2237275160988186e-05, "epoch": 2.5863291139240507, "percentage": 51.79, "elapsed_time": "5:40:49", "remaining_time": "5:17:17"}
638
+ {"current_steps": 638, "total_steps": 1230, "loss": 0.3965, "lr": 2.2180863795301787e-05, "epoch": 2.590379746835443, "percentage": 51.87, "elapsed_time": "5:41:22", "remaining_time": "5:16:45"}
639
+ {"current_steps": 639, "total_steps": 1230, "loss": 0.3858, "lr": 2.212443486523819e-05, "epoch": 2.5944303797468353, "percentage": 51.95, "elapsed_time": "5:41:51", "remaining_time": "5:16:10"}
640
+ {"current_steps": 640, "total_steps": 1230, "loss": 0.3904, "lr": 2.2067988825268243e-05, "epoch": 2.598481012658228, "percentage": 52.03, "elapsed_time": "5:42:28", "remaining_time": "5:15:43"}
641
+ {"current_steps": 641, "total_steps": 1230, "loss": 0.3964, "lr": 2.2011526130000596e-05, "epoch": 2.6025316455696204, "percentage": 52.11, "elapsed_time": "5:43:00", "remaining_time": "5:15:10"}
642
+ {"current_steps": 642, "total_steps": 1230, "loss": 0.4028, "lr": 2.1955047234178038e-05, "epoch": 2.606582278481013, "percentage": 52.2, "elapsed_time": "5:43:33", "remaining_time": "5:14:39"}
643
+ {"current_steps": 643, "total_steps": 1230, "loss": 0.3789, "lr": 2.1898552592673825e-05, "epoch": 2.610632911392405, "percentage": 52.28, "elapsed_time": "5:44:03", "remaining_time": "5:14:05"}
644
+ {"current_steps": 644, "total_steps": 1230, "loss": 0.3947, "lr": 2.184204266048803e-05, "epoch": 2.6146835443037975, "percentage": 52.36, "elapsed_time": "5:44:37", "remaining_time": "5:13:35"}
645
+ {"current_steps": 645, "total_steps": 1230, "loss": 0.3901, "lr": 2.1785517892743887e-05, "epoch": 2.61873417721519, "percentage": 52.44, "elapsed_time": "5:45:10", "remaining_time": "5:13:04"}
646
+ {"current_steps": 646, "total_steps": 1230, "loss": 0.3862, "lr": 2.17289787446841e-05, "epoch": 2.622784810126582, "percentage": 52.52, "elapsed_time": "5:45:43", "remaining_time": "5:12:32"}
647
+ {"current_steps": 647, "total_steps": 1230, "loss": 0.3675, "lr": 2.1672425671667198e-05, "epoch": 2.6268354430379746, "percentage": 52.6, "elapsed_time": "5:46:17", "remaining_time": "5:12:02"}
648
+ {"current_steps": 648, "total_steps": 1230, "loss": 0.3697, "lr": 2.161585912916385e-05, "epoch": 2.630886075949367, "percentage": 52.68, "elapsed_time": "5:46:53", "remaining_time": "5:11:33"}
649
+ {"current_steps": 649, "total_steps": 1230, "loss": 0.3812, "lr": 2.1559279572753214e-05, "epoch": 2.6349367088607596, "percentage": 52.76, "elapsed_time": "5:47:30", "remaining_time": "5:11:05"}
650
+ {"current_steps": 650, "total_steps": 1230, "loss": 0.3887, "lr": 2.1502687458119268e-05, "epoch": 2.638987341772152, "percentage": 52.85, "elapsed_time": "5:48:02", "remaining_time": "5:10:33"}
651
+ {"current_steps": 651, "total_steps": 1230, "loss": 0.3866, "lr": 2.1446083241047116e-05, "epoch": 2.643037974683544, "percentage": 52.93, "elapsed_time": "5:48:34", "remaining_time": "5:10:01"}
652
+ {"current_steps": 652, "total_steps": 1230, "loss": 0.3956, "lr": 2.1389467377419333e-05, "epoch": 2.6470886075949367, "percentage": 53.01, "elapsed_time": "5:49:04", "remaining_time": "5:09:27"}
653
+ {"current_steps": 653, "total_steps": 1230, "loss": 0.3657, "lr": 2.133284032321232e-05, "epoch": 2.651139240506329, "percentage": 53.09, "elapsed_time": "5:49:33", "remaining_time": "5:08:52"}
654
+ {"current_steps": 654, "total_steps": 1230, "loss": 0.409, "lr": 2.1276202534492566e-05, "epoch": 2.6551898734177213, "percentage": 53.17, "elapsed_time": "5:50:05", "remaining_time": "5:08:20"}
655
+ {"current_steps": 655, "total_steps": 1230, "loss": 0.369, "lr": 2.121955446741306e-05, "epoch": 2.659240506329114, "percentage": 53.25, "elapsed_time": "5:50:32", "remaining_time": "5:07:43"}
656
+ {"current_steps": 656, "total_steps": 1230, "loss": 0.3795, "lr": 2.1162896578209517e-05, "epoch": 2.6632911392405063, "percentage": 53.33, "elapsed_time": "5:51:06", "remaining_time": "5:07:13"}
657
+ {"current_steps": 657, "total_steps": 1230, "loss": 0.3919, "lr": 2.1106229323196813e-05, "epoch": 2.667341772151899, "percentage": 53.41, "elapsed_time": "5:51:31", "remaining_time": "5:06:35"}
658
+ {"current_steps": 658, "total_steps": 1230, "loss": 0.3677, "lr": 2.1049553158765214e-05, "epoch": 2.6713924050632913, "percentage": 53.5, "elapsed_time": "5:52:02", "remaining_time": "5:06:01"}
659
+ {"current_steps": 659, "total_steps": 1230, "loss": 0.3725, "lr": 2.0992868541376764e-05, "epoch": 2.6754430379746834, "percentage": 53.58, "elapsed_time": "5:52:33", "remaining_time": "5:05:28"}
660
+ {"current_steps": 660, "total_steps": 1230, "loss": 0.3942, "lr": 2.093617592756158e-05, "epoch": 2.679493670886076, "percentage": 53.66, "elapsed_time": "5:53:07", "remaining_time": "5:04:58"}
661
+ {"current_steps": 661, "total_steps": 1230, "loss": 0.3934, "lr": 2.0879475773914167e-05, "epoch": 2.6835443037974684, "percentage": 53.74, "elapsed_time": "5:53:35", "remaining_time": "5:04:22"}
662
+ {"current_steps": 662, "total_steps": 1230, "loss": 0.4124, "lr": 2.082276853708978e-05, "epoch": 2.6875949367088605, "percentage": 53.82, "elapsed_time": "5:54:07", "remaining_time": "5:03:50"}
663
+ {"current_steps": 663, "total_steps": 1230, "loss": 0.3885, "lr": 2.076605467380071e-05, "epoch": 2.691645569620253, "percentage": 53.9, "elapsed_time": "5:54:39", "remaining_time": "5:03:18"}
664
+ {"current_steps": 664, "total_steps": 1230, "loss": 0.3675, "lr": 2.0709334640812613e-05, "epoch": 2.6956962025316455, "percentage": 53.98, "elapsed_time": "5:55:09", "remaining_time": "5:02:44"}
665
+ {"current_steps": 665, "total_steps": 1230, "loss": 0.4043, "lr": 2.0652608894940824e-05, "epoch": 2.699746835443038, "percentage": 54.07, "elapsed_time": "5:55:40", "remaining_time": "5:02:11"}
666
+ {"current_steps": 666, "total_steps": 1230, "loss": 0.3861, "lr": 2.0595877893046722e-05, "epoch": 2.7037974683544306, "percentage": 54.15, "elapsed_time": "5:56:14", "remaining_time": "5:01:40"}
667
+ {"current_steps": 667, "total_steps": 1230, "loss": 0.3886, "lr": 2.0539142092033985e-05, "epoch": 2.7078481012658226, "percentage": 54.23, "elapsed_time": "5:56:44", "remaining_time": "5:01:06"}
668
+ {"current_steps": 668, "total_steps": 1230, "loss": 0.3689, "lr": 2.048240194884496e-05, "epoch": 2.711898734177215, "percentage": 54.31, "elapsed_time": "5:57:14", "remaining_time": "5:00:33"}
669
+ {"current_steps": 669, "total_steps": 1230, "loss": 0.375, "lr": 2.042565792045695e-05, "epoch": 2.7159493670886077, "percentage": 54.39, "elapsed_time": "5:57:44", "remaining_time": "4:59:59"}
670
+ {"current_steps": 670, "total_steps": 1230, "loss": 0.3749, "lr": 2.036891046387857e-05, "epoch": 2.7199999999999998, "percentage": 54.47, "elapsed_time": "5:58:19", "remaining_time": "4:59:29"}
671
+ {"current_steps": 671, "total_steps": 1230, "loss": 0.3927, "lr": 2.0312160036146036e-05, "epoch": 2.7240506329113923, "percentage": 54.55, "elapsed_time": "5:58:47", "remaining_time": "4:58:53"}
672
+ {"current_steps": 672, "total_steps": 1230, "loss": 0.3885, "lr": 2.025540709431948e-05, "epoch": 2.728101265822785, "percentage": 54.63, "elapsed_time": "5:59:17", "remaining_time": "4:58:20"}
673
+ {"current_steps": 673, "total_steps": 1230, "loss": 0.3918, "lr": 2.0198652095479298e-05, "epoch": 2.7321518987341773, "percentage": 54.72, "elapsed_time": "5:59:48", "remaining_time": "4:57:47"}
674
+ {"current_steps": 674, "total_steps": 1230, "loss": 0.3991, "lr": 2.014189549672245e-05, "epoch": 2.73620253164557, "percentage": 54.8, "elapsed_time": "6:00:21", "remaining_time": "4:57:16"}
675
+ {"current_steps": 675, "total_steps": 1230, "loss": 0.3971, "lr": 2.0085137755158776e-05, "epoch": 2.740253164556962, "percentage": 54.88, "elapsed_time": "6:00:56", "remaining_time": "4:56:46"}
676
+ {"current_steps": 676, "total_steps": 1230, "loss": 0.3826, "lr": 2.0028379327907327e-05, "epoch": 2.7443037974683544, "percentage": 54.96, "elapsed_time": "6:01:29", "remaining_time": "4:56:15"}
677
+ {"current_steps": 677, "total_steps": 1230, "loss": 0.3892, "lr": 1.9971620672092676e-05, "epoch": 2.748354430379747, "percentage": 55.04, "elapsed_time": "6:02:05", "remaining_time": "4:55:46"}
678
+ {"current_steps": 678, "total_steps": 1230, "loss": 0.3892, "lr": 1.991486224484123e-05, "epoch": 2.752405063291139, "percentage": 55.12, "elapsed_time": "6:02:43", "remaining_time": "4:55:19"}
679
+ {"current_steps": 679, "total_steps": 1230, "loss": 0.3954, "lr": 1.985810450327756e-05, "epoch": 2.7564556962025315, "percentage": 55.2, "elapsed_time": "6:03:12", "remaining_time": "4:54:44"}
680
+ {"current_steps": 680, "total_steps": 1230, "loss": 0.3766, "lr": 1.9801347904520706e-05, "epoch": 2.760506329113924, "percentage": 55.28, "elapsed_time": "6:03:51", "remaining_time": "4:54:17"}
681
+ {"current_steps": 681, "total_steps": 1230, "loss": 0.3483, "lr": 1.974459290568053e-05, "epoch": 2.7645569620253165, "percentage": 55.37, "elapsed_time": "6:04:19", "remaining_time": "4:53:42"}
682
+ {"current_steps": 682, "total_steps": 1230, "loss": 0.3766, "lr": 1.968783996385397e-05, "epoch": 2.768607594936709, "percentage": 55.45, "elapsed_time": "6:04:49", "remaining_time": "4:53:08"}
683
+ {"current_steps": 683, "total_steps": 1230, "loss": 0.3832, "lr": 1.963108953612143e-05, "epoch": 2.772658227848101, "percentage": 55.53, "elapsed_time": "6:05:19", "remaining_time": "4:52:34"}
684
+ {"current_steps": 684, "total_steps": 1230, "loss": 0.3802, "lr": 1.9574342079543056e-05, "epoch": 2.7767088607594936, "percentage": 55.61, "elapsed_time": "6:05:49", "remaining_time": "4:52:00"}
685
+ {"current_steps": 685, "total_steps": 1230, "loss": 0.3658, "lr": 1.9517598051155046e-05, "epoch": 2.780759493670886, "percentage": 55.69, "elapsed_time": "6:06:17", "remaining_time": "4:51:25"}
686
+ {"current_steps": 686, "total_steps": 1230, "loss": 0.3785, "lr": 1.9460857907966025e-05, "epoch": 2.7848101265822782, "percentage": 55.77, "elapsed_time": "6:06:44", "remaining_time": "4:50:49"}
687
+ {"current_steps": 687, "total_steps": 1230, "loss": 0.3675, "lr": 1.9404122106953285e-05, "epoch": 2.7888607594936707, "percentage": 55.85, "elapsed_time": "6:07:20", "remaining_time": "4:50:20"}
688
+ {"current_steps": 688, "total_steps": 1230, "loss": 0.3777, "lr": 1.9347391105059176e-05, "epoch": 2.7929113924050633, "percentage": 55.93, "elapsed_time": "6:07:52", "remaining_time": "4:49:48"}
689
+ {"current_steps": 689, "total_steps": 1230, "loss": 0.3984, "lr": 1.92906653591874e-05, "epoch": 2.7969620253164558, "percentage": 56.02, "elapsed_time": "6:08:21", "remaining_time": "4:49:14"}
690
+ {"current_steps": 690, "total_steps": 1230, "loss": 0.4042, "lr": 1.9233945326199295e-05, "epoch": 2.8010126582278483, "percentage": 56.1, "elapsed_time": "6:08:59", "remaining_time": "4:48:46"}
691
+ {"current_steps": 691, "total_steps": 1230, "loss": 0.3992, "lr": 1.917723146291022e-05, "epoch": 2.8050632911392404, "percentage": 56.18, "elapsed_time": "6:09:25", "remaining_time": "4:48:10"}
692
+ {"current_steps": 692, "total_steps": 1230, "loss": 0.3732, "lr": 1.912052422608584e-05, "epoch": 2.809113924050633, "percentage": 56.26, "elapsed_time": "6:09:54", "remaining_time": "4:47:35"}
693
+ {"current_steps": 693, "total_steps": 1230, "loss": 0.3931, "lr": 1.9063824072438428e-05, "epoch": 2.8131645569620254, "percentage": 56.34, "elapsed_time": "6:10:26", "remaining_time": "4:47:02"}
694
+ {"current_steps": 694, "total_steps": 1230, "loss": 0.3938, "lr": 1.9007131458623246e-05, "epoch": 2.8172151898734175, "percentage": 56.42, "elapsed_time": "6:11:00", "remaining_time": "4:46:32"}
695
+ {"current_steps": 695, "total_steps": 1230, "loss": 0.3861, "lr": 1.895044684123479e-05, "epoch": 2.82126582278481, "percentage": 56.5, "elapsed_time": "6:11:36", "remaining_time": "4:46:03"}
696
+ {"current_steps": 696, "total_steps": 1230, "loss": 0.3781, "lr": 1.8893770676803194e-05, "epoch": 2.8253164556962025, "percentage": 56.59, "elapsed_time": "6:12:07", "remaining_time": "4:45:30"}
697
+ {"current_steps": 697, "total_steps": 1230, "loss": 0.3866, "lr": 1.8837103421790486e-05, "epoch": 2.829367088607595, "percentage": 56.67, "elapsed_time": "6:12:40", "remaining_time": "4:44:58"}
698
+ {"current_steps": 698, "total_steps": 1230, "loss": 0.3805, "lr": 1.8780445532586952e-05, "epoch": 2.8334177215189875, "percentage": 56.75, "elapsed_time": "6:13:15", "remaining_time": "4:44:29"}
699
+ {"current_steps": 699, "total_steps": 1230, "loss": 0.3602, "lr": 1.872379746550743e-05, "epoch": 2.8374683544303796, "percentage": 56.83, "elapsed_time": "6:13:50", "remaining_time": "4:43:59"}
700
+ {"current_steps": 700, "total_steps": 1230, "loss": 0.3738, "lr": 1.866715967678769e-05, "epoch": 2.841518987341772, "percentage": 56.91, "elapsed_time": "6:14:21", "remaining_time": "4:43:26"}
701
+ {"current_steps": 701, "total_steps": 1230, "loss": 0.3685, "lr": 1.861053262258067e-05, "epoch": 2.8455696202531646, "percentage": 56.99, "elapsed_time": "6:14:50", "remaining_time": "4:42:52"}
702
+ {"current_steps": 702, "total_steps": 1230, "loss": 0.3838, "lr": 1.8553916758952897e-05, "epoch": 2.8496202531645567, "percentage": 57.07, "elapsed_time": "6:15:22", "remaining_time": "4:42:20"}
703
+ {"current_steps": 703, "total_steps": 1230, "loss": 0.3897, "lr": 1.8497312541880735e-05, "epoch": 2.853670886075949, "percentage": 57.15, "elapsed_time": "6:15:51", "remaining_time": "4:41:45"}
704
+ {"current_steps": 704, "total_steps": 1230, "loss": 0.3615, "lr": 1.8440720427246786e-05, "epoch": 2.8577215189873417, "percentage": 57.24, "elapsed_time": "6:16:23", "remaining_time": "4:41:13"}
705
+ {"current_steps": 705, "total_steps": 1230, "loss": 0.3972, "lr": 1.8384140870836157e-05, "epoch": 2.8617721518987342, "percentage": 57.32, "elapsed_time": "6:16:51", "remaining_time": "4:40:38"}
706
+ {"current_steps": 706, "total_steps": 1230, "loss": 0.3812, "lr": 1.8327574328332806e-05, "epoch": 2.8658227848101268, "percentage": 57.4, "elapsed_time": "6:17:21", "remaining_time": "4:40:04"}
707
+ {"current_steps": 707, "total_steps": 1230, "loss": 0.3639, "lr": 1.8271021255315906e-05, "epoch": 2.869873417721519, "percentage": 57.48, "elapsed_time": "6:17:52", "remaining_time": "4:39:32"}
708
+ {"current_steps": 708, "total_steps": 1230, "loss": 0.3967, "lr": 1.8214482107256117e-05, "epoch": 2.8739240506329113, "percentage": 57.56, "elapsed_time": "6:18:27", "remaining_time": "4:39:02"}
709
+ {"current_steps": 709, "total_steps": 1230, "loss": 0.3792, "lr": 1.8157957339511968e-05, "epoch": 2.877974683544304, "percentage": 57.64, "elapsed_time": "6:18:58", "remaining_time": "4:38:28"}
710
+ {"current_steps": 710, "total_steps": 1230, "loss": 0.3948, "lr": 1.8101447407326182e-05, "epoch": 2.882025316455696, "percentage": 57.72, "elapsed_time": "6:19:30", "remaining_time": "4:37:56"}
711
+ {"current_steps": 711, "total_steps": 1230, "loss": 0.3968, "lr": 1.8044952765821966e-05, "epoch": 2.8860759493670884, "percentage": 57.8, "elapsed_time": "6:20:05", "remaining_time": "4:37:27"}
712
+ {"current_steps": 712, "total_steps": 1230, "loss": 0.374, "lr": 1.7988473869999407e-05, "epoch": 2.890126582278481, "percentage": 57.89, "elapsed_time": "6:20:39", "remaining_time": "4:36:56"}
713
+ {"current_steps": 713, "total_steps": 1230, "loss": 0.396, "lr": 1.7932011174731764e-05, "epoch": 2.8941772151898735, "percentage": 57.97, "elapsed_time": "6:21:13", "remaining_time": "4:36:25"}
714
+ {"current_steps": 714, "total_steps": 1230, "loss": 0.3799, "lr": 1.7875565134761817e-05, "epoch": 2.898227848101266, "percentage": 58.05, "elapsed_time": "6:21:46", "remaining_time": "4:35:54"}
715
+ {"current_steps": 715, "total_steps": 1230, "loss": 0.4031, "lr": 1.7819136204698226e-05, "epoch": 2.902278481012658, "percentage": 58.13, "elapsed_time": "6:22:19", "remaining_time": "4:35:23"}
716
+ {"current_steps": 716, "total_steps": 1230, "loss": 0.3889, "lr": 1.776272483901182e-05, "epoch": 2.9063291139240506, "percentage": 58.21, "elapsed_time": "6:22:55", "remaining_time": "4:34:53"}
717
+ {"current_steps": 717, "total_steps": 1230, "loss": 0.3855, "lr": 1.7706331492031995e-05, "epoch": 2.910379746835443, "percentage": 58.29, "elapsed_time": "6:23:25", "remaining_time": "4:34:19"}
718
+ {"current_steps": 718, "total_steps": 1230, "loss": 0.3688, "lr": 1.764995661794301e-05, "epoch": 2.9144303797468356, "percentage": 58.37, "elapsed_time": "6:23:58", "remaining_time": "4:33:48"}
719
+ {"current_steps": 719, "total_steps": 1230, "loss": 0.3658, "lr": 1.759360067078035e-05, "epoch": 2.918481012658228, "percentage": 58.46, "elapsed_time": "6:24:26", "remaining_time": "4:33:13"}
720
+ {"current_steps": 720, "total_steps": 1230, "loss": 0.3902, "lr": 1.7537264104427064e-05, "epoch": 2.92253164556962, "percentage": 58.54, "elapsed_time": "6:24:57", "remaining_time": "4:32:41"}
721
+ {"current_steps": 721, "total_steps": 1230, "loss": 0.3913, "lr": 1.748094737261012e-05, "epoch": 2.9265822784810127, "percentage": 58.62, "elapsed_time": "6:25:28", "remaining_time": "4:32:07"}
722
+ {"current_steps": 722, "total_steps": 1230, "loss": 0.3877, "lr": 1.7424650928896726e-05, "epoch": 2.9306329113924052, "percentage": 58.7, "elapsed_time": "6:26:01", "remaining_time": "4:31:36"}
723
+ {"current_steps": 723, "total_steps": 1230, "loss": 0.3883, "lr": 1.7368375226690712e-05, "epoch": 2.9346835443037973, "percentage": 58.78, "elapsed_time": "6:26:38", "remaining_time": "4:31:07"}
724
+ {"current_steps": 724, "total_steps": 1230, "loss": 0.3515, "lr": 1.731212071922883e-05, "epoch": 2.93873417721519, "percentage": 58.86, "elapsed_time": "6:27:05", "remaining_time": "4:30:32"}
725
+ {"current_steps": 725, "total_steps": 1230, "loss": 0.3637, "lr": 1.7255887859577156e-05, "epoch": 2.9427848101265823, "percentage": 58.94, "elapsed_time": "6:27:34", "remaining_time": "4:29:58"}
726
+ {"current_steps": 726, "total_steps": 1230, "loss": 0.3836, "lr": 1.7199677100627427e-05, "epoch": 2.946835443037975, "percentage": 59.02, "elapsed_time": "6:28:06", "remaining_time": "4:29:25"}
727
+ {"current_steps": 727, "total_steps": 1230, "loss": 0.3942, "lr": 1.7143488895093343e-05, "epoch": 2.9508860759493674, "percentage": 59.11, "elapsed_time": "6:28:37", "remaining_time": "4:28:53"}
728
+ {"current_steps": 728, "total_steps": 1230, "loss": 0.3725, "lr": 1.7087323695506994e-05, "epoch": 2.9549367088607594, "percentage": 59.19, "elapsed_time": "6:29:13", "remaining_time": "4:28:23"}
729
+ {"current_steps": 729, "total_steps": 1230, "loss": 0.377, "lr": 1.7031181954215194e-05, "epoch": 2.958987341772152, "percentage": 59.27, "elapsed_time": "6:29:45", "remaining_time": "4:27:51"}
730
+ {"current_steps": 730, "total_steps": 1230, "loss": 0.4016, "lr": 1.6975064123375788e-05, "epoch": 2.9630379746835445, "percentage": 59.35, "elapsed_time": "6:30:19", "remaining_time": "4:27:20"}
731
+ {"current_steps": 731, "total_steps": 1230, "loss": 0.3975, "lr": 1.6918970654954084e-05, "epoch": 2.9670886075949365, "percentage": 59.43, "elapsed_time": "6:30:51", "remaining_time": "4:26:48"}
732
+ {"current_steps": 732, "total_steps": 1230, "loss": 0.3771, "lr": 1.686290200071915e-05, "epoch": 2.971139240506329, "percentage": 59.51, "elapsed_time": "6:31:19", "remaining_time": "4:26:13"}
733
+ {"current_steps": 733, "total_steps": 1230, "loss": 0.3851, "lr": 1.6806858612240234e-05, "epoch": 2.9751898734177216, "percentage": 59.59, "elapsed_time": "6:31:51", "remaining_time": "4:25:41"}
734
+ {"current_steps": 734, "total_steps": 1230, "loss": 0.3764, "lr": 1.6750840940883078e-05, "epoch": 2.979240506329114, "percentage": 59.67, "elapsed_time": "6:32:23", "remaining_time": "4:25:09"}
735
+ {"current_steps": 735, "total_steps": 1230, "loss": 0.3712, "lr": 1.6694849437806305e-05, "epoch": 2.9832911392405066, "percentage": 59.76, "elapsed_time": "6:32:47", "remaining_time": "4:24:32"}
736
+ {"current_steps": 736, "total_steps": 1230, "loss": 0.3734, "lr": 1.663888455395778e-05, "epoch": 2.9873417721518987, "percentage": 59.84, "elapsed_time": "6:33:16", "remaining_time": "4:23:57"}
737
+ {"current_steps": 737, "total_steps": 1230, "loss": 0.3844, "lr": 1.6582946740070995e-05, "epoch": 2.991392405063291, "percentage": 59.92, "elapsed_time": "6:33:51", "remaining_time": "4:23:27"}
738
+ {"current_steps": 738, "total_steps": 1230, "loss": 0.3925, "lr": 1.6527036446661396e-05, "epoch": 2.9954430379746837, "percentage": 60.0, "elapsed_time": "6:34:28", "remaining_time": "4:22:58"}
739
+ {"current_steps": 739, "total_steps": 1230, "loss": 0.3444, "lr": 1.6471154124022818e-05, "epoch": 3.0025316455696203, "percentage": 60.08, "elapsed_time": "6:36:52", "remaining_time": "4:23:41"}
740
+ {"current_steps": 740, "total_steps": 1230, "loss": 0.2834, "lr": 1.6415300222223788e-05, "epoch": 3.006582278481013, "percentage": 60.16, "elapsed_time": "6:37:27", "remaining_time": "4:23:11"}
741
+ {"current_steps": 741, "total_steps": 1230, "loss": 0.262, "lr": 1.6359475191103958e-05, "epoch": 3.010632911392405, "percentage": 60.24, "elapsed_time": "6:37:57", "remaining_time": "4:22:37"}
742
+ {"current_steps": 742, "total_steps": 1230, "loss": 0.2802, "lr": 1.6303679480270466e-05, "epoch": 3.0146835443037974, "percentage": 60.33, "elapsed_time": "6:38:28", "remaining_time": "4:22:04"}
743
+ {"current_steps": 743, "total_steps": 1230, "loss": 0.2635, "lr": 1.624791353909428e-05, "epoch": 3.01873417721519, "percentage": 60.41, "elapsed_time": "6:39:07", "remaining_time": "4:21:36"}