yuzhounie commited on
Commit
05aa47c
·
verified ·
1 Parent(s): 05117d4

Training in progress, step 2000

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b2571dcb4a687334c0a0e58557cd7a648f1de6e2012b82a95a174fd838d87143
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fa11074c498b250c34e1135b3445b223c0c417f9aa0c3cd6a9f1eaeec3c4c38
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:cd2107ae35ad3e41b536ee6ce09709f2aeee6cd05e541e5b1e63fc66a78b756c
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:99af590ec7d10a28ed2bb9377151b223d457865838ddaeba02af87b957016b92
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:568e3aac7cb5ad9a110860dde155e0b9c3de0b056d53f8f0707d6591adeb4855
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:293a6404fef7572a626ff113ae5291fd1eb30fec9b0c9711eb55ed9300af7dc3
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a4fb04812f542fef2978558a2e12e6bf2125ca8d95ca08e36fd3363c6aff6ac4
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32472c1723b04ff03a6f981edeee009a11ac05478f1fca736842d8a3cdbeb2ac
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1620,3 +1620,427 @@
1620
  {"current_steps": 1620, "total_steps": 2148, "loss": 0.2219, "lr": 1.7368767540484965e-06, "epoch": 2.2622645896303184, "percentage": 75.42, "elapsed_time": "3:46:04", "remaining_time": "1:13:41"}
1621
  {"current_steps": 1621, "total_steps": 2148, "loss": 0.2537, "lr": 1.7307239886699546e-06, "epoch": 2.2636596140432457, "percentage": 75.47, "elapsed_time": "3:46:10", "remaining_time": "1:13:32"}
1622
  {"current_steps": 1622, "total_steps": 2148, "loss": 0.2409, "lr": 1.7245798587922263e-06, "epoch": 2.265054638456173, "percentage": 75.51, "elapsed_time": "3:46:17", "remaining_time": "1:13:22"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1620
  {"current_steps": 1620, "total_steps": 2148, "loss": 0.2219, "lr": 1.7368767540484965e-06, "epoch": 2.2622645896303184, "percentage": 75.42, "elapsed_time": "3:46:04", "remaining_time": "1:13:41"}
1621
  {"current_steps": 1621, "total_steps": 2148, "loss": 0.2537, "lr": 1.7307239886699546e-06, "epoch": 2.2636596140432457, "percentage": 75.47, "elapsed_time": "3:46:10", "remaining_time": "1:13:32"}
1622
  {"current_steps": 1622, "total_steps": 2148, "loss": 0.2409, "lr": 1.7245798587922263e-06, "epoch": 2.265054638456173, "percentage": 75.51, "elapsed_time": "3:46:17", "remaining_time": "1:13:22"}
1623
+ {"current_steps": 1623, "total_steps": 2148, "loss": 0.2273, "lr": 1.7184443806444851e-06, "epoch": 2.2664496628691, "percentage": 75.56, "elapsed_time": "3:46:27", "remaining_time": "1:13:15"}
1624
+ {"current_steps": 1624, "total_steps": 2148, "loss": 0.2189, "lr": 1.7123175704330514e-06, "epoch": 2.2678446872820275, "percentage": 75.61, "elapsed_time": "3:46:34", "remaining_time": "1:13:06"}
1625
+ {"current_steps": 1625, "total_steps": 2148, "loss": 0.2403, "lr": 1.706199444341341e-06, "epoch": 2.2692397116949548, "percentage": 75.65, "elapsed_time": "3:46:43", "remaining_time": "1:12:58"}
1626
+ {"current_steps": 1626, "total_steps": 2148, "loss": 0.273, "lr": 1.7000900185298418e-06, "epoch": 2.270634736107882, "percentage": 75.7, "elapsed_time": "3:46:49", "remaining_time": "1:12:49"}
1627
+ {"current_steps": 1627, "total_steps": 2148, "loss": 0.2631, "lr": 1.6939893091360577e-06, "epoch": 2.2720297605208093, "percentage": 75.74, "elapsed_time": "3:47:01", "remaining_time": "1:12:41"}
1628
+ {"current_steps": 1628, "total_steps": 2148, "loss": 0.2259, "lr": 1.6878973322744658e-06, "epoch": 2.273424784933736, "percentage": 75.79, "elapsed_time": "3:47:07", "remaining_time": "1:12:32"}
1629
+ {"current_steps": 1629, "total_steps": 2148, "loss": 0.2286, "lr": 1.6818141040364816e-06, "epoch": 2.2748198093466634, "percentage": 75.84, "elapsed_time": "3:47:14", "remaining_time": "1:12:24"}
1630
+ {"current_steps": 1630, "total_steps": 2148, "loss": 0.2257, "lr": 1.6757396404904087e-06, "epoch": 2.2762148337595907, "percentage": 75.88, "elapsed_time": "3:47:21", "remaining_time": "1:12:15"}
1631
+ {"current_steps": 1631, "total_steps": 2148, "loss": 0.24, "lr": 1.6696739576813981e-06, "epoch": 2.277609858172518, "percentage": 75.93, "elapsed_time": "3:47:31", "remaining_time": "1:12:07"}
1632
+ {"current_steps": 1632, "total_steps": 2148, "loss": 0.2641, "lr": 1.6636170716314114e-06, "epoch": 2.279004882585445, "percentage": 75.98, "elapsed_time": "3:47:38", "remaining_time": "1:11:58"}
1633
+ {"current_steps": 1633, "total_steps": 2148, "loss": 0.2624, "lr": 1.657568998339175e-06, "epoch": 2.2803999069983725, "percentage": 76.02, "elapsed_time": "3:47:44", "remaining_time": "1:11:49"}
1634
+ {"current_steps": 1634, "total_steps": 2148, "loss": 0.2485, "lr": 1.6515297537801305e-06, "epoch": 2.2817949314112997, "percentage": 76.07, "elapsed_time": "3:47:50", "remaining_time": "1:11:40"}
1635
+ {"current_steps": 1635, "total_steps": 2148, "loss": 0.2178, "lr": 1.6454993539064075e-06, "epoch": 2.283189955824227, "percentage": 76.12, "elapsed_time": "3:47:57", "remaining_time": "1:11:31"}
1636
+ {"current_steps": 1636, "total_steps": 2148, "loss": 0.2687, "lr": 1.6394778146467672e-06, "epoch": 2.2845849802371543, "percentage": 76.16, "elapsed_time": "3:48:09", "remaining_time": "1:11:24"}
1637
+ {"current_steps": 1637, "total_steps": 2148, "loss": 0.2558, "lr": 1.6334651519065658e-06, "epoch": 2.2859800046500816, "percentage": 76.21, "elapsed_time": "3:48:16", "remaining_time": "1:11:15"}
1638
+ {"current_steps": 1638, "total_steps": 2148, "loss": 0.2441, "lr": 1.6274613815677176e-06, "epoch": 2.287375029063009, "percentage": 76.26, "elapsed_time": "3:48:25", "remaining_time": "1:11:07"}
1639
+ {"current_steps": 1639, "total_steps": 2148, "loss": 0.1963, "lr": 1.6214665194886474e-06, "epoch": 2.2887700534759357, "percentage": 76.3, "elapsed_time": "3:48:34", "remaining_time": "1:10:59"}
1640
+ {"current_steps": 1640, "total_steps": 2148, "loss": 0.2092, "lr": 1.6154805815042457e-06, "epoch": 2.290165077888863, "percentage": 76.35, "elapsed_time": "3:48:42", "remaining_time": "1:10:50"}
1641
+ {"current_steps": 1641, "total_steps": 2148, "loss": 0.2485, "lr": 1.6095035834258365e-06, "epoch": 2.29156010230179, "percentage": 76.4, "elapsed_time": "3:48:48", "remaining_time": "1:10:41"}
1642
+ {"current_steps": 1642, "total_steps": 2148, "loss": 0.1996, "lr": 1.6035355410411252e-06, "epoch": 2.2929551267147175, "percentage": 76.44, "elapsed_time": "3:48:55", "remaining_time": "1:10:32"}
1643
+ {"current_steps": 1643, "total_steps": 2148, "loss": 0.2359, "lr": 1.5975764701141611e-06, "epoch": 2.2943501511276447, "percentage": 76.49, "elapsed_time": "3:49:05", "remaining_time": "1:10:24"}
1644
+ {"current_steps": 1644, "total_steps": 2148, "loss": 0.2416, "lr": 1.5916263863853e-06, "epoch": 2.295745175540572, "percentage": 76.54, "elapsed_time": "3:49:15", "remaining_time": "1:10:17"}
1645
+ {"current_steps": 1645, "total_steps": 2148, "loss": 0.2625, "lr": 1.585685305571159e-06, "epoch": 2.2971401999534993, "percentage": 76.58, "elapsed_time": "3:49:24", "remaining_time": "1:10:08"}
1646
+ {"current_steps": 1646, "total_steps": 2148, "loss": 0.2271, "lr": 1.5797532433645696e-06, "epoch": 2.2985352243664265, "percentage": 76.63, "elapsed_time": "3:49:33", "remaining_time": "1:10:00"}
1647
+ {"current_steps": 1647, "total_steps": 2148, "loss": 0.2363, "lr": 1.5738302154345475e-06, "epoch": 2.299930248779354, "percentage": 76.68, "elapsed_time": "3:49:46", "remaining_time": "1:09:53"}
1648
+ {"current_steps": 1648, "total_steps": 2148, "loss": 0.2319, "lr": 1.5679162374262414e-06, "epoch": 2.3013252731922806, "percentage": 76.72, "elapsed_time": "3:49:53", "remaining_time": "1:09:44"}
1649
+ {"current_steps": 1649, "total_steps": 2148, "loss": 0.2536, "lr": 1.5620113249608943e-06, "epoch": 2.302720297605208, "percentage": 76.77, "elapsed_time": "3:49:59", "remaining_time": "1:09:35"}
1650
+ {"current_steps": 1650, "total_steps": 2148, "loss": 0.2379, "lr": 1.5561154936358069e-06, "epoch": 2.304115322018135, "percentage": 76.82, "elapsed_time": "3:50:09", "remaining_time": "1:09:28"}
1651
+ {"current_steps": 1651, "total_steps": 2148, "loss": 0.2285, "lr": 1.5502287590242942e-06, "epoch": 2.3055103464310625, "percentage": 76.86, "elapsed_time": "3:50:17", "remaining_time": "1:09:19"}
1652
+ {"current_steps": 1652, "total_steps": 2148, "loss": 0.2168, "lr": 1.5443511366756375e-06, "epoch": 2.3069053708439897, "percentage": 76.91, "elapsed_time": "3:50:24", "remaining_time": "1:09:10"}
1653
+ {"current_steps": 1653, "total_steps": 2148, "loss": 0.2428, "lr": 1.53848264211505e-06, "epoch": 2.308300395256917, "percentage": 76.96, "elapsed_time": "3:50:31", "remaining_time": "1:09:01"}
1654
+ {"current_steps": 1654, "total_steps": 2148, "loss": 0.2132, "lr": 1.5326232908436405e-06, "epoch": 2.3096954196698443, "percentage": 77.0, "elapsed_time": "3:50:39", "remaining_time": "1:08:53"}
1655
+ {"current_steps": 1655, "total_steps": 2148, "loss": 0.2326, "lr": 1.526773098338359e-06, "epoch": 2.3110904440827715, "percentage": 77.05, "elapsed_time": "3:50:47", "remaining_time": "1:08:45"}
1656
+ {"current_steps": 1656, "total_steps": 2148, "loss": 0.2299, "lr": 1.5209320800519683e-06, "epoch": 2.312485468495699, "percentage": 77.09, "elapsed_time": "3:50:55", "remaining_time": "1:08:36"}
1657
+ {"current_steps": 1657, "total_steps": 2148, "loss": 0.2514, "lr": 1.515100251412998e-06, "epoch": 2.313880492908626, "percentage": 77.14, "elapsed_time": "3:51:05", "remaining_time": "1:08:28"}
1658
+ {"current_steps": 1658, "total_steps": 2148, "loss": 0.2269, "lr": 1.5092776278257027e-06, "epoch": 2.3152755173215533, "percentage": 77.19, "elapsed_time": "3:51:18", "remaining_time": "1:08:21"}
1659
+ {"current_steps": 1659, "total_steps": 2148, "loss": 0.239, "lr": 1.5034642246700203e-06, "epoch": 2.31667054173448, "percentage": 77.23, "elapsed_time": "3:51:27", "remaining_time": "1:08:13"}
1660
+ {"current_steps": 1660, "total_steps": 2148, "loss": 0.2503, "lr": 1.4976600573015398e-06, "epoch": 2.3180655661474074, "percentage": 77.28, "elapsed_time": "3:51:34", "remaining_time": "1:08:04"}
1661
+ {"current_steps": 1661, "total_steps": 2148, "loss": 0.2497, "lr": 1.4918651410514479e-06, "epoch": 2.3194605905603347, "percentage": 77.33, "elapsed_time": "3:51:43", "remaining_time": "1:07:56"}
1662
+ {"current_steps": 1662, "total_steps": 2148, "loss": 0.2209, "lr": 1.486079491226501e-06, "epoch": 2.320855614973262, "percentage": 77.37, "elapsed_time": "3:51:49", "remaining_time": "1:07:47"}
1663
+ {"current_steps": 1663, "total_steps": 2148, "loss": 0.232, "lr": 1.4803031231089782e-06, "epoch": 2.3222506393861893, "percentage": 77.42, "elapsed_time": "3:52:00", "remaining_time": "1:07:39"}
1664
+ {"current_steps": 1664, "total_steps": 2148, "loss": 0.2228, "lr": 1.4745360519566382e-06, "epoch": 2.3236456637991165, "percentage": 77.47, "elapsed_time": "3:52:09", "remaining_time": "1:07:31"}
1665
+ {"current_steps": 1665, "total_steps": 2148, "loss": 0.2503, "lr": 1.4687782930026833e-06, "epoch": 2.325040688212044, "percentage": 77.51, "elapsed_time": "3:52:16", "remaining_time": "1:07:22"}
1666
+ {"current_steps": 1666, "total_steps": 2148, "loss": 0.2293, "lr": 1.4630298614557236e-06, "epoch": 2.326435712624971, "percentage": 77.56, "elapsed_time": "3:52:22", "remaining_time": "1:07:13"}
1667
+ {"current_steps": 1667, "total_steps": 2148, "loss": 0.2745, "lr": 1.4572907724997249e-06, "epoch": 2.3278307370378983, "percentage": 77.61, "elapsed_time": "3:52:32", "remaining_time": "1:07:05"}
1668
+ {"current_steps": 1668, "total_steps": 2148, "loss": 0.22, "lr": 1.4515610412939791e-06, "epoch": 2.329225761450825, "percentage": 77.65, "elapsed_time": "3:52:39", "remaining_time": "1:06:57"}
1669
+ {"current_steps": 1669, "total_steps": 2148, "loss": 0.2416, "lr": 1.445840682973062e-06, "epoch": 2.3306207858637524, "percentage": 77.7, "elapsed_time": "3:52:45", "remaining_time": "1:06:48"}
1670
+ {"current_steps": 1670, "total_steps": 2148, "loss": 0.2087, "lr": 1.4401297126467884e-06, "epoch": 2.3320158102766797, "percentage": 77.75, "elapsed_time": "3:52:52", "remaining_time": "1:06:39"}
1671
+ {"current_steps": 1671, "total_steps": 2148, "loss": 0.2045, "lr": 1.4344281454001751e-06, "epoch": 2.333410834689607, "percentage": 77.79, "elapsed_time": "3:53:01", "remaining_time": "1:06:31"}
1672
+ {"current_steps": 1672, "total_steps": 2148, "loss": 0.2466, "lr": 1.4287359962934055e-06, "epoch": 2.3348058591025342, "percentage": 77.84, "elapsed_time": "3:53:09", "remaining_time": "1:06:22"}
1673
+ {"current_steps": 1673, "total_steps": 2148, "loss": 0.249, "lr": 1.4230532803617814e-06, "epoch": 2.3362008835154615, "percentage": 77.89, "elapsed_time": "3:53:19", "remaining_time": "1:06:14"}
1674
+ {"current_steps": 1674, "total_steps": 2148, "loss": 0.2427, "lr": 1.4173800126156916e-06, "epoch": 2.337595907928389, "percentage": 77.93, "elapsed_time": "3:53:25", "remaining_time": "1:06:05"}
1675
+ {"current_steps": 1675, "total_steps": 2148, "loss": 0.224, "lr": 1.411716208040566e-06, "epoch": 2.338990932341316, "percentage": 77.98, "elapsed_time": "3:53:33", "remaining_time": "1:05:57"}
1676
+ {"current_steps": 1676, "total_steps": 2148, "loss": 0.2487, "lr": 1.4060618815968375e-06, "epoch": 2.3403859567542433, "percentage": 78.03, "elapsed_time": "3:53:41", "remaining_time": "1:05:48"}
1677
+ {"current_steps": 1677, "total_steps": 2148, "loss": 0.2616, "lr": 1.4004170482199054e-06, "epoch": 2.3417809811671706, "percentage": 78.07, "elapsed_time": "3:53:50", "remaining_time": "1:05:40"}
1678
+ {"current_steps": 1678, "total_steps": 2148, "loss": 0.2101, "lr": 1.3947817228200956e-06, "epoch": 2.343176005580098, "percentage": 78.12, "elapsed_time": "3:53:56", "remaining_time": "1:05:31"}
1679
+ {"current_steps": 1679, "total_steps": 2148, "loss": 0.2634, "lr": 1.3891559202826133e-06, "epoch": 2.3445710299930247, "percentage": 78.17, "elapsed_time": "3:54:04", "remaining_time": "1:05:23"}
1680
+ {"current_steps": 1680, "total_steps": 2148, "loss": 0.2358, "lr": 1.3835396554675179e-06, "epoch": 2.345966054405952, "percentage": 78.21, "elapsed_time": "3:54:12", "remaining_time": "1:05:14"}
1681
+ {"current_steps": 1681, "total_steps": 2148, "loss": 0.261, "lr": 1.37793294320967e-06, "epoch": 2.3473610788188792, "percentage": 78.26, "elapsed_time": "3:54:19", "remaining_time": "1:05:05"}
1682
+ {"current_steps": 1682, "total_steps": 2148, "loss": 0.2166, "lr": 1.3723357983186974e-06, "epoch": 2.3487561032318065, "percentage": 78.31, "elapsed_time": "3:54:26", "remaining_time": "1:04:57"}
1683
+ {"current_steps": 1683, "total_steps": 2148, "loss": 0.2259, "lr": 1.3667482355789607e-06, "epoch": 2.3501511276447338, "percentage": 78.35, "elapsed_time": "3:54:33", "remaining_time": "1:04:48"}
1684
+ {"current_steps": 1684, "total_steps": 2148, "loss": 0.2127, "lr": 1.3611702697495088e-06, "epoch": 2.351546152057661, "percentage": 78.4, "elapsed_time": "3:54:40", "remaining_time": "1:04:39"}
1685
+ {"current_steps": 1685, "total_steps": 2148, "loss": 0.2327, "lr": 1.3556019155640416e-06, "epoch": 2.3529411764705883, "percentage": 78.45, "elapsed_time": "3:54:49", "remaining_time": "1:04:31"}
1686
+ {"current_steps": 1686, "total_steps": 2148, "loss": 0.2382, "lr": 1.350043187730868e-06, "epoch": 2.3543362008835156, "percentage": 78.49, "elapsed_time": "3:54:57", "remaining_time": "1:04:22"}
1687
+ {"current_steps": 1687, "total_steps": 2148, "loss": 0.234, "lr": 1.34449410093287e-06, "epoch": 2.355731225296443, "percentage": 78.54, "elapsed_time": "3:55:04", "remaining_time": "1:04:14"}
1688
+ {"current_steps": 1688, "total_steps": 2148, "loss": 0.2153, "lr": 1.3389546698274686e-06, "epoch": 2.3571262497093697, "percentage": 78.58, "elapsed_time": "3:55:12", "remaining_time": "1:04:05"}
1689
+ {"current_steps": 1689, "total_steps": 2148, "loss": 0.2486, "lr": 1.333424909046574e-06, "epoch": 2.358521274122297, "percentage": 78.63, "elapsed_time": "3:55:20", "remaining_time": "1:03:57"}
1690
+ {"current_steps": 1690, "total_steps": 2148, "loss": 0.2581, "lr": 1.327904833196556e-06, "epoch": 2.359916298535224, "percentage": 78.68, "elapsed_time": "3:55:26", "remaining_time": "1:03:48"}
1691
+ {"current_steps": 1691, "total_steps": 2148, "loss": 0.2151, "lr": 1.3223944568582047e-06, "epoch": 2.3613113229481515, "percentage": 78.72, "elapsed_time": "3:55:33", "remaining_time": "1:03:39"}
1692
+ {"current_steps": 1692, "total_steps": 2148, "loss": 0.2289, "lr": 1.3168937945866861e-06, "epoch": 2.3627063473610788, "percentage": 78.77, "elapsed_time": "3:55:42", "remaining_time": "1:03:31"}
1693
+ {"current_steps": 1693, "total_steps": 2148, "loss": 0.2416, "lr": 1.311402860911507e-06, "epoch": 2.364101371774006, "percentage": 78.82, "elapsed_time": "3:55:51", "remaining_time": "1:03:23"}
1694
+ {"current_steps": 1694, "total_steps": 2148, "loss": 0.2189, "lr": 1.3059216703364814e-06, "epoch": 2.3654963961869333, "percentage": 78.86, "elapsed_time": "3:55:58", "remaining_time": "1:03:14"}
1695
+ {"current_steps": 1695, "total_steps": 2148, "loss": 0.2364, "lr": 1.3004502373396821e-06, "epoch": 2.3668914205998606, "percentage": 78.91, "elapsed_time": "3:56:06", "remaining_time": "1:03:05"}
1696
+ {"current_steps": 1696, "total_steps": 2148, "loss": 0.2428, "lr": 1.2949885763734127e-06, "epoch": 2.368286445012788, "percentage": 78.96, "elapsed_time": "3:56:12", "remaining_time": "1:02:57"}
1697
+ {"current_steps": 1697, "total_steps": 2148, "loss": 0.2219, "lr": 1.2895367018641658e-06, "epoch": 2.369681469425715, "percentage": 79.0, "elapsed_time": "3:56:19", "remaining_time": "1:02:48"}
1698
+ {"current_steps": 1698, "total_steps": 2148, "loss": 0.2582, "lr": 1.284094628212576e-06, "epoch": 2.3710764938386424, "percentage": 79.05, "elapsed_time": "3:56:27", "remaining_time": "1:02:39"}
1699
+ {"current_steps": 1699, "total_steps": 2148, "loss": 0.2196, "lr": 1.278662369793398e-06, "epoch": 2.372471518251569, "percentage": 79.1, "elapsed_time": "3:56:33", "remaining_time": "1:02:30"}
1700
+ {"current_steps": 1700, "total_steps": 2148, "loss": 0.2552, "lr": 1.273239940955459e-06, "epoch": 2.3738665426644965, "percentage": 79.14, "elapsed_time": "3:56:39", "remaining_time": "1:02:22"}
1701
+ {"current_steps": 1701, "total_steps": 2148, "loss": 0.2621, "lr": 1.267827356021618e-06, "epoch": 2.3752615670774238, "percentage": 79.19, "elapsed_time": "3:56:51", "remaining_time": "1:02:14"}
1702
+ {"current_steps": 1702, "total_steps": 2148, "loss": 0.2347, "lr": 1.2624246292887377e-06, "epoch": 2.376656591490351, "percentage": 79.24, "elapsed_time": "3:56:59", "remaining_time": "1:02:06"}
1703
+ {"current_steps": 1703, "total_steps": 2148, "loss": 0.2582, "lr": 1.2570317750276374e-06, "epoch": 2.3780516159032783, "percentage": 79.28, "elapsed_time": "3:57:06", "remaining_time": "1:01:57"}
1704
+ {"current_steps": 1704, "total_steps": 2148, "loss": 0.2473, "lr": 1.2516488074830586e-06, "epoch": 2.3794466403162056, "percentage": 79.33, "elapsed_time": "3:57:13", "remaining_time": "1:01:48"}
1705
+ {"current_steps": 1705, "total_steps": 2148, "loss": 0.2301, "lr": 1.246275740873631e-06, "epoch": 2.380841664729133, "percentage": 79.38, "elapsed_time": "3:57:19", "remaining_time": "1:01:39"}
1706
+ {"current_steps": 1706, "total_steps": 2148, "loss": 0.2533, "lr": 1.2409125893918329e-06, "epoch": 2.38223668914206, "percentage": 79.42, "elapsed_time": "3:57:29", "remaining_time": "1:01:31"}
1707
+ {"current_steps": 1707, "total_steps": 2148, "loss": 0.1988, "lr": 1.2355593672039462e-06, "epoch": 2.3836317135549874, "percentage": 79.47, "elapsed_time": "3:57:39", "remaining_time": "1:01:23"}
1708
+ {"current_steps": 1708, "total_steps": 2148, "loss": 0.2623, "lr": 1.2302160884500337e-06, "epoch": 2.385026737967914, "percentage": 79.52, "elapsed_time": "3:57:46", "remaining_time": "1:01:15"}
1709
+ {"current_steps": 1709, "total_steps": 2148, "loss": 0.2035, "lr": 1.2248827672438868e-06, "epoch": 2.3864217623808415, "percentage": 79.56, "elapsed_time": "3:57:55", "remaining_time": "1:01:06"}
1710
+ {"current_steps": 1710, "total_steps": 2148, "loss": 0.236, "lr": 1.2195594176729963e-06, "epoch": 2.3878167867937687, "percentage": 79.61, "elapsed_time": "3:58:05", "remaining_time": "1:00:59"}
1711
+ {"current_steps": 1711, "total_steps": 2148, "loss": 0.2325, "lr": 1.2142460537985168e-06, "epoch": 2.389211811206696, "percentage": 79.66, "elapsed_time": "3:58:11", "remaining_time": "1:00:50"}
1712
+ {"current_steps": 1712, "total_steps": 2148, "loss": 0.2245, "lr": 1.2089426896552265e-06, "epoch": 2.3906068356196233, "percentage": 79.7, "elapsed_time": "3:58:19", "remaining_time": "1:00:41"}
1713
+ {"current_steps": 1713, "total_steps": 2148, "loss": 0.2654, "lr": 1.2036493392514847e-06, "epoch": 2.3920018600325506, "percentage": 79.75, "elapsed_time": "3:58:26", "remaining_time": "1:00:32"}
1714
+ {"current_steps": 1714, "total_steps": 2148, "loss": 0.2071, "lr": 1.1983660165692078e-06, "epoch": 2.393396884445478, "percentage": 79.8, "elapsed_time": "3:58:32", "remaining_time": "1:00:24"}
1715
+ {"current_steps": 1715, "total_steps": 2148, "loss": 0.2438, "lr": 1.1930927355638189e-06, "epoch": 2.394791908858405, "percentage": 79.84, "elapsed_time": "3:58:42", "remaining_time": "1:00:16"}
1716
+ {"current_steps": 1716, "total_steps": 2148, "loss": 0.2314, "lr": 1.1878295101642185e-06, "epoch": 2.3961869332713324, "percentage": 79.89, "elapsed_time": "3:58:51", "remaining_time": "1:00:07"}
1717
+ {"current_steps": 1717, "total_steps": 2148, "loss": 0.2304, "lr": 1.182576354272748e-06, "epoch": 2.3975819576842596, "percentage": 79.93, "elapsed_time": "3:58:58", "remaining_time": "0:59:59"}
1718
+ {"current_steps": 1718, "total_steps": 2148, "loss": 0.226, "lr": 1.1773332817651512e-06, "epoch": 2.398976982097187, "percentage": 79.98, "elapsed_time": "3:59:08", "remaining_time": "0:59:51"}
1719
+ {"current_steps": 1719, "total_steps": 2148, "loss": 0.2132, "lr": 1.1721003064905329e-06, "epoch": 2.400372006510114, "percentage": 80.03, "elapsed_time": "3:59:15", "remaining_time": "0:59:42"}
1720
+ {"current_steps": 1720, "total_steps": 2148, "loss": 0.2419, "lr": 1.1668774422713336e-06, "epoch": 2.401767030923041, "percentage": 80.07, "elapsed_time": "3:59:22", "remaining_time": "0:59:33"}
1721
+ {"current_steps": 1721, "total_steps": 2148, "loss": 0.24, "lr": 1.1616647029032818e-06, "epoch": 2.4031620553359683, "percentage": 80.12, "elapsed_time": "3:59:36", "remaining_time": "0:59:26"}
1722
+ {"current_steps": 1722, "total_steps": 2148, "loss": 0.2309, "lr": 1.1564621021553617e-06, "epoch": 2.4045570797488955, "percentage": 80.17, "elapsed_time": "3:59:45", "remaining_time": "0:59:18"}
1723
+ {"current_steps": 1723, "total_steps": 2148, "loss": 0.2641, "lr": 1.1512696537697804e-06, "epoch": 2.405952104161823, "percentage": 80.21, "elapsed_time": "3:59:52", "remaining_time": "0:59:10"}
1724
+ {"current_steps": 1724, "total_steps": 2148, "loss": 0.2649, "lr": 1.1460873714619275e-06, "epoch": 2.40734712857475, "percentage": 80.26, "elapsed_time": "3:59:59", "remaining_time": "0:59:01"}
1725
+ {"current_steps": 1725, "total_steps": 2148, "loss": 0.2409, "lr": 1.140915268920339e-06, "epoch": 2.4087421529876774, "percentage": 80.31, "elapsed_time": "4:00:06", "remaining_time": "0:58:52"}
1726
+ {"current_steps": 1726, "total_steps": 2148, "loss": 0.2245, "lr": 1.13575335980666e-06, "epoch": 2.4101371774006046, "percentage": 80.35, "elapsed_time": "4:00:12", "remaining_time": "0:58:43"}
1727
+ {"current_steps": 1727, "total_steps": 2148, "loss": 0.2241, "lr": 1.130601657755616e-06, "epoch": 2.411532201813532, "percentage": 80.4, "elapsed_time": "4:00:22", "remaining_time": "0:58:35"}
1728
+ {"current_steps": 1728, "total_steps": 2148, "loss": 0.2287, "lr": 1.125460176374965e-06, "epoch": 2.4129272262264587, "percentage": 80.45, "elapsed_time": "4:00:28", "remaining_time": "0:58:27"}
1729
+ {"current_steps": 1729, "total_steps": 2148, "loss": 0.2544, "lr": 1.1203289292454728e-06, "epoch": 2.414322250639386, "percentage": 80.49, "elapsed_time": "4:00:36", "remaining_time": "0:58:18"}
1730
+ {"current_steps": 1730, "total_steps": 2148, "loss": 0.2478, "lr": 1.1152079299208724e-06, "epoch": 2.4157172750523133, "percentage": 80.54, "elapsed_time": "4:00:47", "remaining_time": "0:58:10"}
1731
+ {"current_steps": 1731, "total_steps": 2148, "loss": 0.2302, "lr": 1.1100971919278247e-06, "epoch": 2.4171122994652405, "percentage": 80.59, "elapsed_time": "4:00:54", "remaining_time": "0:58:02"}
1732
+ {"current_steps": 1732, "total_steps": 2148, "loss": 0.2428, "lr": 1.104996728765887e-06, "epoch": 2.418507323878168, "percentage": 80.63, "elapsed_time": "4:01:02", "remaining_time": "0:57:53"}
1733
+ {"current_steps": 1733, "total_steps": 2148, "loss": 0.2413, "lr": 1.0999065539074793e-06, "epoch": 2.419902348291095, "percentage": 80.68, "elapsed_time": "4:01:11", "remaining_time": "0:57:45"}
1734
+ {"current_steps": 1734, "total_steps": 2148, "loss": 0.231, "lr": 1.094826680797843e-06, "epoch": 2.4212973727040223, "percentage": 80.73, "elapsed_time": "4:01:20", "remaining_time": "0:57:37"}
1735
+ {"current_steps": 1735, "total_steps": 2148, "loss": 0.2467, "lr": 1.0897571228550097e-06, "epoch": 2.4226923971169496, "percentage": 80.77, "elapsed_time": "4:01:28", "remaining_time": "0:57:28"}
1736
+ {"current_steps": 1736, "total_steps": 2148, "loss": 0.2423, "lr": 1.0846978934697666e-06, "epoch": 2.424087421529877, "percentage": 80.82, "elapsed_time": "4:01:36", "remaining_time": "0:57:20"}
1737
+ {"current_steps": 1737, "total_steps": 2148, "loss": 0.2341, "lr": 1.0796490060056142e-06, "epoch": 2.425482445942804, "percentage": 80.87, "elapsed_time": "4:01:43", "remaining_time": "0:57:11"}
1738
+ {"current_steps": 1738, "total_steps": 2148, "loss": 0.2293, "lr": 1.074610473798738e-06, "epoch": 2.4268774703557314, "percentage": 80.91, "elapsed_time": "4:01:50", "remaining_time": "0:57:03"}
1739
+ {"current_steps": 1739, "total_steps": 2148, "loss": 0.2223, "lr": 1.0695823101579728e-06, "epoch": 2.4282724947686587, "percentage": 80.96, "elapsed_time": "4:01:57", "remaining_time": "0:56:54"}
1740
+ {"current_steps": 1740, "total_steps": 2148, "loss": 0.2377, "lr": 1.0645645283647616e-06, "epoch": 2.4296675191815855, "percentage": 81.01, "elapsed_time": "4:02:04", "remaining_time": "0:56:45"}
1741
+ {"current_steps": 1741, "total_steps": 2148, "loss": 0.2311, "lr": 1.0595571416731293e-06, "epoch": 2.431062543594513, "percentage": 81.05, "elapsed_time": "4:02:13", "remaining_time": "0:56:37"}
1742
+ {"current_steps": 1742, "total_steps": 2148, "loss": 0.2199, "lr": 1.0545601633096414e-06, "epoch": 2.43245756800744, "percentage": 81.1, "elapsed_time": "4:02:19", "remaining_time": "0:56:28"}
1743
+ {"current_steps": 1743, "total_steps": 2148, "loss": 0.2502, "lr": 1.049573606473369e-06, "epoch": 2.4338525924203673, "percentage": 81.15, "elapsed_time": "4:02:26", "remaining_time": "0:56:20"}
1744
+ {"current_steps": 1744, "total_steps": 2148, "loss": 0.2072, "lr": 1.0445974843358563e-06, "epoch": 2.4352476168332946, "percentage": 81.19, "elapsed_time": "4:02:33", "remaining_time": "0:56:11"}
1745
+ {"current_steps": 1745, "total_steps": 2148, "loss": 0.2224, "lr": 1.0396318100410868e-06, "epoch": 2.436642641246222, "percentage": 81.24, "elapsed_time": "4:02:40", "remaining_time": "0:56:02"}
1746
+ {"current_steps": 1746, "total_steps": 2148, "loss": 0.2581, "lr": 1.0346765967054472e-06, "epoch": 2.438037665659149, "percentage": 81.28, "elapsed_time": "4:02:46", "remaining_time": "0:55:53"}
1747
+ {"current_steps": 1747, "total_steps": 2148, "loss": 0.2598, "lr": 1.029731857417689e-06, "epoch": 2.4394326900720764, "percentage": 81.33, "elapsed_time": "4:02:52", "remaining_time": "0:55:44"}
1748
+ {"current_steps": 1748, "total_steps": 2148, "loss": 0.2369, "lr": 1.0247976052389018e-06, "epoch": 2.4408277144850032, "percentage": 81.38, "elapsed_time": "4:02:59", "remaining_time": "0:55:36"}
1749
+ {"current_steps": 1749, "total_steps": 2148, "loss": 0.2181, "lr": 1.0198738532024715e-06, "epoch": 2.4422227388979305, "percentage": 81.42, "elapsed_time": "4:03:06", "remaining_time": "0:55:27"}
1750
+ {"current_steps": 1750, "total_steps": 2148, "loss": 0.2466, "lr": 1.0149606143140484e-06, "epoch": 2.443617763310858, "percentage": 81.47, "elapsed_time": "4:03:13", "remaining_time": "0:55:18"}
1751
+ {"current_steps": 1751, "total_steps": 2148, "loss": 0.2392, "lr": 1.0100579015515156e-06, "epoch": 2.445012787723785, "percentage": 81.52, "elapsed_time": "4:03:21", "remaining_time": "0:55:10"}
1752
+ {"current_steps": 1752, "total_steps": 2148, "loss": 0.2393, "lr": 1.005165727864953e-06, "epoch": 2.4464078121367123, "percentage": 81.56, "elapsed_time": "4:03:28", "remaining_time": "0:55:01"}
1753
+ {"current_steps": 1753, "total_steps": 2148, "loss": 0.2249, "lr": 1.0002841061765989e-06, "epoch": 2.4478028365496396, "percentage": 81.61, "elapsed_time": "4:03:35", "remaining_time": "0:54:53"}
1754
+ {"current_steps": 1754, "total_steps": 2148, "loss": 0.2337, "lr": 9.954130493808201e-07, "epoch": 2.449197860962567, "percentage": 81.66, "elapsed_time": "4:03:42", "remaining_time": "0:54:44"}
1755
+ {"current_steps": 1755, "total_steps": 2148, "loss": 0.2291, "lr": 9.905525703440815e-07, "epoch": 2.450592885375494, "percentage": 81.7, "elapsed_time": "4:03:49", "remaining_time": "0:54:36"}
1756
+ {"current_steps": 1756, "total_steps": 2148, "loss": 0.2133, "lr": 9.85702681904902e-07, "epoch": 2.4519879097884214, "percentage": 81.75, "elapsed_time": "4:04:00", "remaining_time": "0:54:28"}
1757
+ {"current_steps": 1757, "total_steps": 2148, "loss": 0.2371, "lr": 9.808633968738297e-07, "epoch": 2.4533829342013487, "percentage": 81.8, "elapsed_time": "4:04:07", "remaining_time": "0:54:19"}
1758
+ {"current_steps": 1758, "total_steps": 2148, "loss": 0.2537, "lr": 9.760347280334064e-07, "epoch": 2.454777958614276, "percentage": 81.84, "elapsed_time": "4:04:14", "remaining_time": "0:54:10"}
1759
+ {"current_steps": 1759, "total_steps": 2148, "loss": 0.2427, "lr": 9.712166881381279e-07, "epoch": 2.456172983027203, "percentage": 81.89, "elapsed_time": "4:04:21", "remaining_time": "0:54:02"}
1760
+ {"current_steps": 1760, "total_steps": 2148, "loss": 0.2497, "lr": 9.664092899144156e-07, "epoch": 2.45756800744013, "percentage": 81.94, "elapsed_time": "4:04:28", "remaining_time": "0:53:53"}
1761
+ {"current_steps": 1761, "total_steps": 2148, "loss": 0.2189, "lr": 9.616125460605857e-07, "epoch": 2.4589630318530573, "percentage": 81.98, "elapsed_time": "4:04:37", "remaining_time": "0:53:45"}
1762
+ {"current_steps": 1762, "total_steps": 2148, "loss": 0.2163, "lr": 9.56826469246806e-07, "epoch": 2.4603580562659846, "percentage": 82.03, "elapsed_time": "4:04:46", "remaining_time": "0:53:37"}
1763
+ {"current_steps": 1763, "total_steps": 2148, "loss": 0.2188, "lr": 9.520510721150722e-07, "epoch": 2.461753080678912, "percentage": 82.08, "elapsed_time": "4:04:52", "remaining_time": "0:53:28"}
1764
+ {"current_steps": 1764, "total_steps": 2148, "loss": 0.2784, "lr": 9.472863672791721e-07, "epoch": 2.463148105091839, "percentage": 82.12, "elapsed_time": "4:05:01", "remaining_time": "0:53:20"}
1765
+ {"current_steps": 1765, "total_steps": 2148, "loss": 0.2322, "lr": 9.425323673246461e-07, "epoch": 2.4645431295047664, "percentage": 82.17, "elapsed_time": "4:05:09", "remaining_time": "0:53:11"}
1766
+ {"current_steps": 1766, "total_steps": 2148, "loss": 0.2427, "lr": 9.377890848087595e-07, "epoch": 2.4659381539176937, "percentage": 82.22, "elapsed_time": "4:05:15", "remaining_time": "0:53:03"}
1767
+ {"current_steps": 1767, "total_steps": 2148, "loss": 0.2544, "lr": 9.330565322604729e-07, "epoch": 2.467333178330621, "percentage": 82.26, "elapsed_time": "4:05:28", "remaining_time": "0:52:55"}
1768
+ {"current_steps": 1768, "total_steps": 2148, "loss": 0.2343, "lr": 9.283347221803985e-07, "epoch": 2.468728202743548, "percentage": 82.31, "elapsed_time": "4:05:35", "remaining_time": "0:52:47"}
1769
+ {"current_steps": 1769, "total_steps": 2148, "loss": 0.261, "lr": 9.236236670407772e-07, "epoch": 2.470123227156475, "percentage": 82.36, "elapsed_time": "4:05:42", "remaining_time": "0:52:38"}
1770
+ {"current_steps": 1770, "total_steps": 2148, "loss": 0.2511, "lr": 9.189233792854424e-07, "epoch": 2.4715182515694023, "percentage": 82.4, "elapsed_time": "4:05:48", "remaining_time": "0:52:29"}
1771
+ {"current_steps": 1771, "total_steps": 2148, "loss": 0.2462, "lr": 9.142338713297838e-07, "epoch": 2.4729132759823296, "percentage": 82.45, "elapsed_time": "4:05:57", "remaining_time": "0:52:21"}
1772
+ {"current_steps": 1772, "total_steps": 2148, "loss": 0.2422, "lr": 9.095551555607169e-07, "epoch": 2.474308300395257, "percentage": 82.5, "elapsed_time": "4:06:04", "remaining_time": "0:52:12"}
1773
+ {"current_steps": 1773, "total_steps": 2148, "loss": 0.2473, "lr": 9.048872443366529e-07, "epoch": 2.475703324808184, "percentage": 82.54, "elapsed_time": "4:06:12", "remaining_time": "0:52:04"}
1774
+ {"current_steps": 1774, "total_steps": 2148, "loss": 0.2346, "lr": 9.002301499874622e-07, "epoch": 2.4770983492211114, "percentage": 82.59, "elapsed_time": "4:06:20", "remaining_time": "0:51:56"}
1775
+ {"current_steps": 1775, "total_steps": 2148, "loss": 0.2225, "lr": 8.955838848144449e-07, "epoch": 2.4784933736340387, "percentage": 82.64, "elapsed_time": "4:06:28", "remaining_time": "0:51:47"}
1776
+ {"current_steps": 1776, "total_steps": 2148, "loss": 0.2554, "lr": 8.909484610902958e-07, "epoch": 2.479888398046966, "percentage": 82.68, "elapsed_time": "4:06:38", "remaining_time": "0:51:39"}
1777
+ {"current_steps": 1777, "total_steps": 2148, "loss": 0.2093, "lr": 8.863238910590704e-07, "epoch": 2.481283422459893, "percentage": 82.73, "elapsed_time": "4:06:46", "remaining_time": "0:51:31"}
1778
+ {"current_steps": 1778, "total_steps": 2148, "loss": 0.2481, "lr": 8.817101869361599e-07, "epoch": 2.4826784468728205, "percentage": 82.77, "elapsed_time": "4:06:52", "remaining_time": "0:51:22"}
1779
+ {"current_steps": 1779, "total_steps": 2148, "loss": 0.264, "lr": 8.77107360908253e-07, "epoch": 2.4840734712857477, "percentage": 82.82, "elapsed_time": "4:07:00", "remaining_time": "0:51:14"}
1780
+ {"current_steps": 1780, "total_steps": 2148, "loss": 0.2328, "lr": 8.725154251333012e-07, "epoch": 2.4854684956986746, "percentage": 82.87, "elapsed_time": "4:07:06", "remaining_time": "0:51:05"}
1781
+ {"current_steps": 1781, "total_steps": 2148, "loss": 0.2952, "lr": 8.679343917404959e-07, "epoch": 2.486863520111602, "percentage": 82.91, "elapsed_time": "4:07:19", "remaining_time": "0:50:57"}
1782
+ {"current_steps": 1782, "total_steps": 2148, "loss": 0.239, "lr": 8.633642728302266e-07, "epoch": 2.488258544524529, "percentage": 82.96, "elapsed_time": "4:07:25", "remaining_time": "0:50:49"}
1783
+ {"current_steps": 1783, "total_steps": 2148, "loss": 0.2282, "lr": 8.588050804740527e-07, "epoch": 2.4896535689374564, "percentage": 83.01, "elapsed_time": "4:07:34", "remaining_time": "0:50:40"}
1784
+ {"current_steps": 1784, "total_steps": 2148, "loss": 0.2184, "lr": 8.542568267146761e-07, "epoch": 2.4910485933503836, "percentage": 83.05, "elapsed_time": "4:07:43", "remaining_time": "0:50:32"}
1785
+ {"current_steps": 1785, "total_steps": 2148, "loss": 0.2139, "lr": 8.49719523565904e-07, "epoch": 2.492443617763311, "percentage": 83.1, "elapsed_time": "4:07:50", "remaining_time": "0:50:24"}
1786
+ {"current_steps": 1786, "total_steps": 2148, "loss": 0.2395, "lr": 8.451931830126148e-07, "epoch": 2.493838642176238, "percentage": 83.15, "elapsed_time": "4:07:58", "remaining_time": "0:50:15"}
1787
+ {"current_steps": 1787, "total_steps": 2148, "loss": 0.2276, "lr": 8.40677817010736e-07, "epoch": 2.4952336665891655, "percentage": 83.19, "elapsed_time": "4:08:10", "remaining_time": "0:50:08"}
1788
+ {"current_steps": 1788, "total_steps": 2148, "loss": 0.2396, "lr": 8.361734374872032e-07, "epoch": 2.4966286910020927, "percentage": 83.24, "elapsed_time": "4:08:17", "remaining_time": "0:49:59"}
1789
+ {"current_steps": 1789, "total_steps": 2148, "loss": 0.2243, "lr": 8.316800563399307e-07, "epoch": 2.4980237154150196, "percentage": 83.29, "elapsed_time": "4:08:24", "remaining_time": "0:49:50"}
1790
+ {"current_steps": 1790, "total_steps": 2148, "loss": 0.2184, "lr": 8.271976854377861e-07, "epoch": 2.499418739827947, "percentage": 83.33, "elapsed_time": "4:08:30", "remaining_time": "0:49:42"}
1791
+ {"current_steps": 1791, "total_steps": 2148, "loss": 0.2617, "lr": 8.227263366205523e-07, "epoch": 2.500813764240874, "percentage": 83.38, "elapsed_time": "4:08:39", "remaining_time": "0:49:33"}
1792
+ {"current_steps": 1792, "total_steps": 2148, "loss": 0.3254, "lr": 8.182660216988964e-07, "epoch": 2.5022087886538014, "percentage": 83.43, "elapsed_time": "4:08:46", "remaining_time": "0:49:25"}
1793
+ {"current_steps": 1793, "total_steps": 2148, "loss": 0.2494, "lr": 8.138167524543445e-07, "epoch": 2.5036038130667286, "percentage": 83.47, "elapsed_time": "4:08:52", "remaining_time": "0:49:16"}
1794
+ {"current_steps": 1794, "total_steps": 2148, "loss": 0.2518, "lr": 8.09378540639243e-07, "epoch": 2.504998837479656, "percentage": 83.52, "elapsed_time": "4:09:03", "remaining_time": "0:49:08"}
1795
+ {"current_steps": 1795, "total_steps": 2148, "loss": 0.2461, "lr": 8.049513979767304e-07, "epoch": 2.506393861892583, "percentage": 83.57, "elapsed_time": "4:09:10", "remaining_time": "0:49:00"}
1796
+ {"current_steps": 1796, "total_steps": 2148, "loss": 0.1999, "lr": 8.00535336160711e-07, "epoch": 2.5077888863055104, "percentage": 83.61, "elapsed_time": "4:09:16", "remaining_time": "0:48:51"}
1797
+ {"current_steps": 1797, "total_steps": 2148, "loss": 0.2423, "lr": 7.96130366855819e-07, "epoch": 2.5091839107184377, "percentage": 83.66, "elapsed_time": "4:09:22", "remaining_time": "0:48:42"}
1798
+ {"current_steps": 1798, "total_steps": 2148, "loss": 0.2203, "lr": 7.917365016973866e-07, "epoch": 2.510578935131365, "percentage": 83.71, "elapsed_time": "4:09:29", "remaining_time": "0:48:33"}
1799
+ {"current_steps": 1799, "total_steps": 2148, "loss": 0.2518, "lr": 7.873537522914155e-07, "epoch": 2.5119739595442923, "percentage": 83.75, "elapsed_time": "4:09:38", "remaining_time": "0:48:25"}
1800
+ {"current_steps": 1800, "total_steps": 2148, "loss": 0.2359, "lr": 7.829821302145485e-07, "epoch": 2.5133689839572195, "percentage": 83.8, "elapsed_time": "4:09:45", "remaining_time": "0:48:17"}
1801
+ {"current_steps": 1801, "total_steps": 2148, "loss": 0.2333, "lr": 7.786216470140334e-07, "epoch": 2.5147640083701464, "percentage": 83.85, "elapsed_time": "4:09:52", "remaining_time": "0:48:08"}
1802
+ {"current_steps": 1802, "total_steps": 2148, "loss": 0.2298, "lr": 7.742723142076991e-07, "epoch": 2.5161590327830736, "percentage": 83.89, "elapsed_time": "4:09:59", "remaining_time": "0:47:59"}
1803
+ {"current_steps": 1803, "total_steps": 2148, "loss": 0.245, "lr": 7.699341432839203e-07, "epoch": 2.517554057196001, "percentage": 83.94, "elapsed_time": "4:10:05", "remaining_time": "0:47:51"}
1804
+ {"current_steps": 1804, "total_steps": 2148, "loss": 0.2082, "lr": 7.656071457015879e-07, "epoch": 2.518949081608928, "percentage": 83.99, "elapsed_time": "4:10:12", "remaining_time": "0:47:42"}
1805
+ {"current_steps": 1805, "total_steps": 2148, "loss": 0.2297, "lr": 7.612913328900784e-07, "epoch": 2.5203441060218554, "percentage": 84.03, "elapsed_time": "4:10:22", "remaining_time": "0:47:34"}
1806
+ {"current_steps": 1806, "total_steps": 2148, "loss": 0.2006, "lr": 7.569867162492283e-07, "epoch": 2.5217391304347827, "percentage": 84.08, "elapsed_time": "4:10:31", "remaining_time": "0:47:26"}
1807
+ {"current_steps": 1807, "total_steps": 2148, "loss": 0.2649, "lr": 7.526933071492959e-07, "epoch": 2.52313415484771, "percentage": 84.12, "elapsed_time": "4:10:43", "remaining_time": "0:47:18"}
1808
+ {"current_steps": 1808, "total_steps": 2148, "loss": 0.2274, "lr": 7.484111169309399e-07, "epoch": 2.524529179260637, "percentage": 84.17, "elapsed_time": "4:10:51", "remaining_time": "0:47:10"}
1809
+ {"current_steps": 1809, "total_steps": 2148, "loss": 0.2304, "lr": 7.441401569051848e-07, "epoch": 2.525924203673564, "percentage": 84.22, "elapsed_time": "4:11:03", "remaining_time": "0:47:02"}
1810
+ {"current_steps": 1810, "total_steps": 2148, "loss": 0.2153, "lr": 7.398804383533886e-07, "epoch": 2.5273192280864913, "percentage": 84.26, "elapsed_time": "4:11:10", "remaining_time": "0:46:54"}
1811
+ {"current_steps": 1811, "total_steps": 2148, "loss": 0.2349, "lr": 7.356319725272165e-07, "epoch": 2.5287142524994186, "percentage": 84.31, "elapsed_time": "4:11:16", "remaining_time": "0:46:45"}
1812
+ {"current_steps": 1812, "total_steps": 2148, "loss": 0.2438, "lr": 7.313947706486136e-07, "epoch": 2.530109276912346, "percentage": 84.36, "elapsed_time": "4:11:26", "remaining_time": "0:46:37"}
1813
+ {"current_steps": 1813, "total_steps": 2148, "loss": 0.2594, "lr": 7.271688439097713e-07, "epoch": 2.531504301325273, "percentage": 84.4, "elapsed_time": "4:11:36", "remaining_time": "0:46:29"}
1814
+ {"current_steps": 1814, "total_steps": 2148, "loss": 0.1927, "lr": 7.229542034730952e-07, "epoch": 2.5328993257382004, "percentage": 84.45, "elapsed_time": "4:11:43", "remaining_time": "0:46:20"}
1815
+ {"current_steps": 1815, "total_steps": 2148, "loss": 0.2412, "lr": 7.187508604711851e-07, "epoch": 2.5342943501511277, "percentage": 84.5, "elapsed_time": "4:11:52", "remaining_time": "0:46:12"}
1816
+ {"current_steps": 1816, "total_steps": 2148, "loss": 0.2534, "lr": 7.145588260067943e-07, "epoch": 2.535689374564055, "percentage": 84.54, "elapsed_time": "4:12:00", "remaining_time": "0:46:04"}
1817
+ {"current_steps": 1817, "total_steps": 2148, "loss": 0.239, "lr": 7.103781111528074e-07, "epoch": 2.5370843989769822, "percentage": 84.59, "elapsed_time": "4:12:11", "remaining_time": "0:45:56"}
1818
+ {"current_steps": 1818, "total_steps": 2148, "loss": 0.208, "lr": 7.062087269522105e-07, "epoch": 2.5384794233899095, "percentage": 84.64, "elapsed_time": "4:12:18", "remaining_time": "0:45:47"}
1819
+ {"current_steps": 1819, "total_steps": 2148, "loss": 0.2397, "lr": 7.020506844180608e-07, "epoch": 2.5398744478028368, "percentage": 84.68, "elapsed_time": "4:12:26", "remaining_time": "0:45:39"}
1820
+ {"current_steps": 1820, "total_steps": 2148, "loss": 0.245, "lr": 6.979039945334543e-07, "epoch": 2.541269472215764, "percentage": 84.73, "elapsed_time": "4:12:32", "remaining_time": "0:45:30"}
1821
+ {"current_steps": 1821, "total_steps": 2148, "loss": 0.2358, "lr": 6.937686682515044e-07, "epoch": 2.542664496628691, "percentage": 84.78, "elapsed_time": "4:12:39", "remaining_time": "0:45:22"}
1822
+ {"current_steps": 1822, "total_steps": 2148, "loss": 0.2563, "lr": 6.896447164953057e-07, "epoch": 2.544059521041618, "percentage": 84.82, "elapsed_time": "4:12:46", "remaining_time": "0:45:13"}
1823
+ {"current_steps": 1823, "total_steps": 2148, "loss": 0.2371, "lr": 6.855321501579077e-07, "epoch": 2.5454545454545454, "percentage": 84.87, "elapsed_time": "4:12:56", "remaining_time": "0:45:05"}
1824
+ {"current_steps": 1824, "total_steps": 2148, "loss": 0.2388, "lr": 6.814309801022873e-07, "epoch": 2.5468495698674727, "percentage": 84.92, "elapsed_time": "4:13:06", "remaining_time": "0:44:57"}
1825
+ {"current_steps": 1825, "total_steps": 2148, "loss": 0.2625, "lr": 6.77341217161322e-07, "epoch": 2.5482445942804, "percentage": 84.96, "elapsed_time": "4:13:13", "remaining_time": "0:44:48"}
1826
+ {"current_steps": 1826, "total_steps": 2148, "loss": 0.2172, "lr": 6.732628721377533e-07, "epoch": 2.5496396186933272, "percentage": 85.01, "elapsed_time": "4:13:19", "remaining_time": "0:44:40"}
1827
+ {"current_steps": 1827, "total_steps": 2148, "loss": 0.289, "lr": 6.69195955804165e-07, "epoch": 2.5510346431062545, "percentage": 85.06, "elapsed_time": "4:13:26", "remaining_time": "0:44:31"}
1828
+ {"current_steps": 1828, "total_steps": 2148, "loss": 0.2345, "lr": 6.651404789029553e-07, "epoch": 2.5524296675191813, "percentage": 85.1, "elapsed_time": "4:13:37", "remaining_time": "0:44:23"}
1829
+ {"current_steps": 1829, "total_steps": 2148, "loss": 0.2353, "lr": 6.610964521463032e-07, "epoch": 2.5538246919321086, "percentage": 85.15, "elapsed_time": "4:13:47", "remaining_time": "0:44:15"}
1830
+ {"current_steps": 1830, "total_steps": 2148, "loss": 0.2114, "lr": 6.570638862161449e-07, "epoch": 2.555219716345036, "percentage": 85.2, "elapsed_time": "4:13:54", "remaining_time": "0:44:07"}
1831
+ {"current_steps": 1831, "total_steps": 2148, "loss": 0.2164, "lr": 6.530427917641447e-07, "epoch": 2.556614740757963, "percentage": 85.24, "elapsed_time": "4:14:02", "remaining_time": "0:43:58"}
1832
+ {"current_steps": 1832, "total_steps": 2148, "loss": 0.2533, "lr": 6.490331794116633e-07, "epoch": 2.5580097651708904, "percentage": 85.29, "elapsed_time": "4:14:10", "remaining_time": "0:43:50"}
1833
+ {"current_steps": 1833, "total_steps": 2148, "loss": 0.2094, "lr": 6.450350597497335e-07, "epoch": 2.5594047895838177, "percentage": 85.34, "elapsed_time": "4:14:17", "remaining_time": "0:43:41"}
1834
+ {"current_steps": 1834, "total_steps": 2148, "loss": 0.2552, "lr": 6.410484433390335e-07, "epoch": 2.560799813996745, "percentage": 85.38, "elapsed_time": "4:14:27", "remaining_time": "0:43:33"}
1835
+ {"current_steps": 1835, "total_steps": 2148, "loss": 0.2034, "lr": 6.370733407098517e-07, "epoch": 2.562194838409672, "percentage": 85.43, "elapsed_time": "4:14:36", "remaining_time": "0:43:25"}
1836
+ {"current_steps": 1836, "total_steps": 2148, "loss": 0.2379, "lr": 6.331097623620697e-07, "epoch": 2.5635898628225995, "percentage": 85.47, "elapsed_time": "4:14:47", "remaining_time": "0:43:17"}
1837
+ {"current_steps": 1837, "total_steps": 2148, "loss": 0.223, "lr": 6.291577187651255e-07, "epoch": 2.5649848872355268, "percentage": 85.52, "elapsed_time": "4:14:53", "remaining_time": "0:43:09"}
1838
+ {"current_steps": 1838, "total_steps": 2148, "loss": 0.2411, "lr": 6.252172203579892e-07, "epoch": 2.566379911648454, "percentage": 85.57, "elapsed_time": "4:15:00", "remaining_time": "0:43:00"}
1839
+ {"current_steps": 1839, "total_steps": 2148, "loss": 0.269, "lr": 6.212882775491352e-07, "epoch": 2.5677749360613813, "percentage": 85.61, "elapsed_time": "4:15:09", "remaining_time": "0:42:52"}
1840
+ {"current_steps": 1840, "total_steps": 2148, "loss": 0.2432, "lr": 6.173709007165158e-07, "epoch": 2.5691699604743086, "percentage": 85.66, "elapsed_time": "4:15:17", "remaining_time": "0:42:44"}
1841
+ {"current_steps": 1841, "total_steps": 2148, "loss": 0.2335, "lr": 6.134651002075315e-07, "epoch": 2.5705649848872354, "percentage": 85.71, "elapsed_time": "4:15:25", "remaining_time": "0:42:35"}
1842
+ {"current_steps": 1842, "total_steps": 2148, "loss": 0.2428, "lr": 6.095708863390065e-07, "epoch": 2.5719600093001627, "percentage": 85.75, "elapsed_time": "4:15:34", "remaining_time": "0:42:27"}
1843
+ {"current_steps": 1843, "total_steps": 2148, "loss": 0.2201, "lr": 6.056882693971605e-07, "epoch": 2.57335503371309, "percentage": 85.8, "elapsed_time": "4:15:42", "remaining_time": "0:42:18"}
1844
+ {"current_steps": 1844, "total_steps": 2148, "loss": 0.2652, "lr": 6.018172596375776e-07, "epoch": 2.574750058126017, "percentage": 85.85, "elapsed_time": "4:15:48", "remaining_time": "0:42:10"}
1845
+ {"current_steps": 1845, "total_steps": 2148, "loss": 0.2481, "lr": 5.979578672851843e-07, "epoch": 2.5761450825389445, "percentage": 85.89, "elapsed_time": "4:15:59", "remaining_time": "0:42:02"}
1846
+ {"current_steps": 1846, "total_steps": 2148, "loss": 0.2221, "lr": 5.941101025342239e-07, "epoch": 2.5775401069518717, "percentage": 85.94, "elapsed_time": "4:16:09", "remaining_time": "0:41:54"}
1847
+ {"current_steps": 1847, "total_steps": 2148, "loss": 0.29, "lr": 5.902739755482201e-07, "epoch": 2.578935131364799, "percentage": 85.99, "elapsed_time": "4:16:17", "remaining_time": "0:41:45"}
1848
+ {"current_steps": 1848, "total_steps": 2148, "loss": 0.2135, "lr": 5.864494964599615e-07, "epoch": 2.580330155777726, "percentage": 86.03, "elapsed_time": "4:16:23", "remaining_time": "0:41:37"}
1849
+ {"current_steps": 1849, "total_steps": 2148, "loss": 0.2359, "lr": 5.826366753714707e-07, "epoch": 2.581725180190653, "percentage": 86.08, "elapsed_time": "4:16:33", "remaining_time": "0:41:29"}
1850
+ {"current_steps": 1850, "total_steps": 2148, "loss": 0.2244, "lr": 5.788355223539698e-07, "epoch": 2.5831202046035804, "percentage": 86.13, "elapsed_time": "4:16:42", "remaining_time": "0:41:21"}
1851
+ {"current_steps": 1851, "total_steps": 2148, "loss": 0.2228, "lr": 5.750460474478675e-07, "epoch": 2.5845152290165077, "percentage": 86.17, "elapsed_time": "4:16:49", "remaining_time": "0:41:12"}
1852
+ {"current_steps": 1852, "total_steps": 2148, "loss": 0.2294, "lr": 5.712682606627251e-07, "epoch": 2.585910253429435, "percentage": 86.22, "elapsed_time": "4:16:56", "remaining_time": "0:41:03"}
1853
+ {"current_steps": 1853, "total_steps": 2148, "loss": 0.2463, "lr": 5.675021719772262e-07, "epoch": 2.587305277842362, "percentage": 86.27, "elapsed_time": "4:17:07", "remaining_time": "0:40:56"}
1854
+ {"current_steps": 1854, "total_steps": 2148, "loss": 0.2242, "lr": 5.637477913391604e-07, "epoch": 2.5887003022552895, "percentage": 86.31, "elapsed_time": "4:17:13", "remaining_time": "0:40:47"}
1855
+ {"current_steps": 1855, "total_steps": 2148, "loss": 0.2568, "lr": 5.600051286653884e-07, "epoch": 2.5900953266682167, "percentage": 86.36, "elapsed_time": "4:17:23", "remaining_time": "0:40:39"}
1856
+ {"current_steps": 1856, "total_steps": 2148, "loss": 0.2281, "lr": 5.562741938418187e-07, "epoch": 2.591490351081144, "percentage": 86.41, "elapsed_time": "4:17:29", "remaining_time": "0:40:30"}
1857
+ {"current_steps": 1857, "total_steps": 2148, "loss": 0.2368, "lr": 5.525549967233829e-07, "epoch": 2.5928853754940713, "percentage": 86.45, "elapsed_time": "4:17:36", "remaining_time": "0:40:22"}
1858
+ {"current_steps": 1858, "total_steps": 2148, "loss": 0.2341, "lr": 5.488475471340099e-07, "epoch": 2.5942803999069985, "percentage": 86.5, "elapsed_time": "4:17:44", "remaining_time": "0:40:13"}
1859
+ {"current_steps": 1859, "total_steps": 2148, "loss": 0.2429, "lr": 5.451518548665946e-07, "epoch": 2.595675424319926, "percentage": 86.55, "elapsed_time": "4:17:51", "remaining_time": "0:40:05"}
1860
+ {"current_steps": 1860, "total_steps": 2148, "loss": 0.2287, "lr": 5.414679296829806e-07, "epoch": 2.597070448732853, "percentage": 86.59, "elapsed_time": "4:17:57", "remaining_time": "0:39:56"}
1861
+ {"current_steps": 1861, "total_steps": 2148, "loss": 0.1991, "lr": 5.377957813139262e-07, "epoch": 2.59846547314578, "percentage": 86.64, "elapsed_time": "4:18:05", "remaining_time": "0:39:48"}
1862
+ {"current_steps": 1862, "total_steps": 2148, "loss": 0.3004, "lr": 5.341354194590831e-07, "epoch": 2.599860497558707, "percentage": 86.69, "elapsed_time": "4:18:11", "remaining_time": "0:39:39"}
1863
+ {"current_steps": 1863, "total_steps": 2148, "loss": 0.2219, "lr": 5.304868537869706e-07, "epoch": 2.6012555219716345, "percentage": 86.73, "elapsed_time": "4:18:18", "remaining_time": "0:39:30"}
1864
+ {"current_steps": 1864, "total_steps": 2148, "loss": 0.2283, "lr": 5.268500939349514e-07, "epoch": 2.6026505463845617, "percentage": 86.78, "elapsed_time": "4:18:25", "remaining_time": "0:39:22"}
1865
+ {"current_steps": 1865, "total_steps": 2148, "loss": 0.2133, "lr": 5.232251495091989e-07, "epoch": 2.604045570797489, "percentage": 86.82, "elapsed_time": "4:18:32", "remaining_time": "0:39:13"}
1866
+ {"current_steps": 1866, "total_steps": 2148, "loss": 0.221, "lr": 5.196120300846835e-07, "epoch": 2.6054405952104163, "percentage": 86.87, "elapsed_time": "4:18:39", "remaining_time": "0:39:05"}
1867
+ {"current_steps": 1867, "total_steps": 2148, "loss": 0.2478, "lr": 5.160107452051361e-07, "epoch": 2.6068356196233435, "percentage": 86.92, "elapsed_time": "4:18:45", "remaining_time": "0:38:56"}
1868
+ {"current_steps": 1868, "total_steps": 2148, "loss": 0.2033, "lr": 5.124213043830278e-07, "epoch": 2.6082306440362704, "percentage": 86.96, "elapsed_time": "4:18:51", "remaining_time": "0:38:48"}
1869
+ {"current_steps": 1869, "total_steps": 2148, "loss": 0.2132, "lr": 5.088437170995481e-07, "epoch": 2.6096256684491976, "percentage": 87.01, "elapsed_time": "4:18:58", "remaining_time": "0:38:39"}
1870
+ {"current_steps": 1870, "total_steps": 2148, "loss": 0.2257, "lr": 5.052779928045737e-07, "epoch": 2.611020692862125, "percentage": 87.06, "elapsed_time": "4:19:04", "remaining_time": "0:38:30"}
1871
+ {"current_steps": 1871, "total_steps": 2148, "loss": 0.2365, "lr": 5.01724140916649e-07, "epoch": 2.612415717275052, "percentage": 87.1, "elapsed_time": "4:19:13", "remaining_time": "0:38:22"}
1872
+ {"current_steps": 1872, "total_steps": 2148, "loss": 0.2523, "lr": 4.981821708229545e-07, "epoch": 2.6138107416879794, "percentage": 87.15, "elapsed_time": "4:19:19", "remaining_time": "0:38:13"}
1873
+ {"current_steps": 1873, "total_steps": 2148, "loss": 0.22, "lr": 4.946520918792886e-07, "epoch": 2.6152057661009067, "percentage": 87.2, "elapsed_time": "4:19:25", "remaining_time": "0:38:05"}
1874
+ {"current_steps": 1874, "total_steps": 2148, "loss": 0.2504, "lr": 4.911339134100401e-07, "epoch": 2.616600790513834, "percentage": 87.24, "elapsed_time": "4:19:32", "remaining_time": "0:37:56"}
1875
+ {"current_steps": 1875, "total_steps": 2148, "loss": 0.2391, "lr": 4.87627644708163e-07, "epoch": 2.6179958149267613, "percentage": 87.29, "elapsed_time": "4:19:42", "remaining_time": "0:37:48"}
1876
+ {"current_steps": 1876, "total_steps": 2148, "loss": 0.2452, "lr": 4.841332950351535e-07, "epoch": 2.6193908393396885, "percentage": 87.34, "elapsed_time": "4:19:49", "remaining_time": "0:37:40"}
1877
+ {"current_steps": 1877, "total_steps": 2148, "loss": 0.2378, "lr": 4.806508736210253e-07, "epoch": 2.620785863752616, "percentage": 87.38, "elapsed_time": "4:20:01", "remaining_time": "0:37:32"}
1878
+ {"current_steps": 1878, "total_steps": 2148, "loss": 0.218, "lr": 4.771803896642812e-07, "epoch": 2.622180888165543, "percentage": 87.43, "elapsed_time": "4:20:14", "remaining_time": "0:37:24"}
1879
+ {"current_steps": 1879, "total_steps": 2148, "loss": 0.2575, "lr": 4.737218523318965e-07, "epoch": 2.6235759125784703, "percentage": 87.48, "elapsed_time": "4:20:21", "remaining_time": "0:37:16"}
1880
+ {"current_steps": 1880, "total_steps": 2148, "loss": 0.2195, "lr": 4.7027527075929e-07, "epoch": 2.6249709369913976, "percentage": 87.52, "elapsed_time": "4:20:27", "remaining_time": "0:37:07"}
1881
+ {"current_steps": 1881, "total_steps": 2148, "loss": 0.2384, "lr": 4.6684065405029677e-07, "epoch": 2.6263659614043244, "percentage": 87.57, "elapsed_time": "4:20:34", "remaining_time": "0:36:59"}
1882
+ {"current_steps": 1882, "total_steps": 2148, "loss": 0.2247, "lr": 4.6341801127715303e-07, "epoch": 2.6277609858172517, "percentage": 87.62, "elapsed_time": "4:20:41", "remaining_time": "0:36:50"}
1883
+ {"current_steps": 1883, "total_steps": 2148, "loss": 0.2536, "lr": 4.6000735148046316e-07, "epoch": 2.629156010230179, "percentage": 87.66, "elapsed_time": "4:20:52", "remaining_time": "0:36:42"}
1884
+ {"current_steps": 1884, "total_steps": 2148, "loss": 0.2277, "lr": 4.566086836691791e-07, "epoch": 2.6305510346431062, "percentage": 87.71, "elapsed_time": "4:20:59", "remaining_time": "0:36:34"}
1885
+ {"current_steps": 1885, "total_steps": 2148, "loss": 0.2421, "lr": 4.532220168205798e-07, "epoch": 2.6319460590560335, "percentage": 87.76, "elapsed_time": "4:21:06", "remaining_time": "0:36:25"}
1886
+ {"current_steps": 1886, "total_steps": 2148, "loss": 0.2053, "lr": 4.498473598802444e-07, "epoch": 2.633341083468961, "percentage": 87.8, "elapsed_time": "4:21:16", "remaining_time": "0:36:17"}
1887
+ {"current_steps": 1887, "total_steps": 2148, "loss": 0.2315, "lr": 4.464847217620266e-07, "epoch": 2.634736107881888, "percentage": 87.85, "elapsed_time": "4:21:23", "remaining_time": "0:36:09"}
1888
+ {"current_steps": 1888, "total_steps": 2148, "loss": 0.2463, "lr": 4.4313411134803584e-07, "epoch": 2.636131132294815, "percentage": 87.9, "elapsed_time": "4:21:29", "remaining_time": "0:36:00"}
1889
+ {"current_steps": 1889, "total_steps": 2148, "loss": 0.2174, "lr": 4.397955374886104e-07, "epoch": 2.637526156707742, "percentage": 87.94, "elapsed_time": "4:21:42", "remaining_time": "0:35:52"}
1890
+ {"current_steps": 1890, "total_steps": 2148, "loss": 0.2393, "lr": 4.364690090022938e-07, "epoch": 2.6389211811206694, "percentage": 87.99, "elapsed_time": "4:21:51", "remaining_time": "0:35:44"}
1891
+ {"current_steps": 1891, "total_steps": 2148, "loss": 0.2322, "lr": 4.331545346758159e-07, "epoch": 2.6403162055335967, "percentage": 88.04, "elapsed_time": "4:22:05", "remaining_time": "0:35:37"}
1892
+ {"current_steps": 1892, "total_steps": 2148, "loss": 0.2112, "lr": 4.2985212326406456e-07, "epoch": 2.641711229946524, "percentage": 88.08, "elapsed_time": "4:22:12", "remaining_time": "0:35:28"}
1893
+ {"current_steps": 1893, "total_steps": 2148, "loss": 0.2139, "lr": 4.265617834900637e-07, "epoch": 2.6431062543594512, "percentage": 88.13, "elapsed_time": "4:22:23", "remaining_time": "0:35:20"}
1894
+ {"current_steps": 1894, "total_steps": 2148, "loss": 0.2031, "lr": 4.2328352404495346e-07, "epoch": 2.6445012787723785, "percentage": 88.18, "elapsed_time": "4:22:30", "remaining_time": "0:35:12"}
1895
+ {"current_steps": 1895, "total_steps": 2148, "loss": 0.2053, "lr": 4.2001735358796316e-07, "epoch": 2.6458963031853058, "percentage": 88.22, "elapsed_time": "4:22:37", "remaining_time": "0:35:03"}
1896
+ {"current_steps": 1896, "total_steps": 2148, "loss": 0.2058, "lr": 4.167632807463895e-07, "epoch": 2.647291327598233, "percentage": 88.27, "elapsed_time": "4:22:50", "remaining_time": "0:34:56"}
1897
+ {"current_steps": 1897, "total_steps": 2148, "loss": 0.227, "lr": 4.135213141155769e-07, "epoch": 2.6486863520111603, "percentage": 88.31, "elapsed_time": "4:22:57", "remaining_time": "0:34:47"}
1898
+ {"current_steps": 1898, "total_steps": 2148, "loss": 0.2367, "lr": 4.1029146225889103e-07, "epoch": 2.6500813764240876, "percentage": 88.36, "elapsed_time": "4:23:05", "remaining_time": "0:34:39"}
1899
+ {"current_steps": 1899, "total_steps": 2148, "loss": 0.2345, "lr": 4.0707373370769634e-07, "epoch": 2.651476400837015, "percentage": 88.41, "elapsed_time": "4:23:11", "remaining_time": "0:34:30"}
1900
+ {"current_steps": 1900, "total_steps": 2148, "loss": 0.235, "lr": 4.0386813696133564e-07, "epoch": 2.652871425249942, "percentage": 88.45, "elapsed_time": "4:23:17", "remaining_time": "0:34:22"}
1901
+ {"current_steps": 1901, "total_steps": 2148, "loss": 0.2194, "lr": 4.0067468048710756e-07, "epoch": 2.654266449662869, "percentage": 88.5, "elapsed_time": "4:23:25", "remaining_time": "0:34:13"}
1902
+ {"current_steps": 1902, "total_steps": 2148, "loss": 0.228, "lr": 3.974933727202412e-07, "epoch": 2.6556614740757962, "percentage": 88.55, "elapsed_time": "4:23:33", "remaining_time": "0:34:05"}
1903
+ {"current_steps": 1903, "total_steps": 2148, "loss": 0.2135, "lr": 3.943242220638777e-07, "epoch": 2.6570564984887235, "percentage": 88.59, "elapsed_time": "4:23:41", "remaining_time": "0:33:56"}
1904
+ {"current_steps": 1904, "total_steps": 2148, "loss": 0.2403, "lr": 3.911672368890462e-07, "epoch": 2.6584515229016508, "percentage": 88.64, "elapsed_time": "4:23:47", "remaining_time": "0:33:48"}
1905
+ {"current_steps": 1905, "total_steps": 2148, "loss": 0.2307, "lr": 3.8802242553464096e-07, "epoch": 2.659846547314578, "percentage": 88.69, "elapsed_time": "4:23:55", "remaining_time": "0:33:39"}
1906
+ {"current_steps": 1906, "total_steps": 2148, "loss": 0.2272, "lr": 3.8488979630739996e-07, "epoch": 2.6612415717275053, "percentage": 88.73, "elapsed_time": "4:24:05", "remaining_time": "0:33:31"}
1907
+ {"current_steps": 1907, "total_steps": 2148, "loss": 0.1872, "lr": 3.8176935748188425e-07, "epoch": 2.6626365961404326, "percentage": 88.78, "elapsed_time": "4:24:17", "remaining_time": "0:33:24"}
1908
+ {"current_steps": 1908, "total_steps": 2148, "loss": 0.2069, "lr": 3.78661117300454e-07, "epoch": 2.66403162055336, "percentage": 88.83, "elapsed_time": "4:24:27", "remaining_time": "0:33:15"}
1909
+ {"current_steps": 1909, "total_steps": 2148, "loss": 0.2139, "lr": 3.755650839732489e-07, "epoch": 2.6654266449662867, "percentage": 88.87, "elapsed_time": "4:24:34", "remaining_time": "0:33:07"}
1910
+ {"current_steps": 1910, "total_steps": 2148, "loss": 0.2557, "lr": 3.7248126567816454e-07, "epoch": 2.666821669379214, "percentage": 88.92, "elapsed_time": "4:24:40", "remaining_time": "0:32:58"}
1911
+ {"current_steps": 1911, "total_steps": 2148, "loss": 0.2375, "lr": 3.694096705608319e-07, "epoch": 2.668216693792141, "percentage": 88.97, "elapsed_time": "4:24:50", "remaining_time": "0:32:50"}
1912
+ {"current_steps": 1912, "total_steps": 2148, "loss": 0.2215, "lr": 3.6635030673459413e-07, "epoch": 2.6696117182050685, "percentage": 89.01, "elapsed_time": "4:24:59", "remaining_time": "0:32:42"}
1913
+ {"current_steps": 1913, "total_steps": 2148, "loss": 0.248, "lr": 3.6330318228049e-07, "epoch": 2.6710067426179958, "percentage": 89.06, "elapsed_time": "4:25:07", "remaining_time": "0:32:34"}
1914
+ {"current_steps": 1914, "total_steps": 2148, "loss": 0.2407, "lr": 3.6026830524722443e-07, "epoch": 2.672401767030923, "percentage": 89.11, "elapsed_time": "4:25:13", "remaining_time": "0:32:25"}
1915
+ {"current_steps": 1915, "total_steps": 2148, "loss": 0.2443, "lr": 3.572456836511551e-07, "epoch": 2.6737967914438503, "percentage": 89.15, "elapsed_time": "4:25:25", "remaining_time": "0:32:17"}
1916
+ {"current_steps": 1916, "total_steps": 2148, "loss": 0.2205, "lr": 3.5423532547626816e-07, "epoch": 2.6751918158567776, "percentage": 89.2, "elapsed_time": "4:25:33", "remaining_time": "0:32:09"}
1917
+ {"current_steps": 1917, "total_steps": 2148, "loss": 0.1948, "lr": 3.5123723867415527e-07, "epoch": 2.676586840269705, "percentage": 89.25, "elapsed_time": "4:25:44", "remaining_time": "0:32:01"}
1918
+ {"current_steps": 1918, "total_steps": 2148, "loss": 0.2197, "lr": 3.4825143116399454e-07, "epoch": 2.677981864682632, "percentage": 89.29, "elapsed_time": "4:25:51", "remaining_time": "0:31:52"}
1919
+ {"current_steps": 1919, "total_steps": 2148, "loss": 0.2173, "lr": 3.452779108325316e-07, "epoch": 2.6793768890955594, "percentage": 89.34, "elapsed_time": "4:25:57", "remaining_time": "0:31:44"}
1920
+ {"current_steps": 1920, "total_steps": 2148, "loss": 0.2216, "lr": 3.4231668553405316e-07, "epoch": 2.6807719135084866, "percentage": 89.39, "elapsed_time": "4:26:04", "remaining_time": "0:31:35"}
1921
+ {"current_steps": 1921, "total_steps": 2148, "loss": 0.2404, "lr": 3.39367763090373e-07, "epoch": 2.6821669379214135, "percentage": 89.43, "elapsed_time": "4:26:10", "remaining_time": "0:31:27"}
1922
+ {"current_steps": 1922, "total_steps": 2148, "loss": 0.2371, "lr": 3.3643115129080695e-07, "epoch": 2.6835619623343407, "percentage": 89.48, "elapsed_time": "4:26:20", "remaining_time": "0:31:19"}
1923
+ {"current_steps": 1923, "total_steps": 2148, "loss": 0.2249, "lr": 3.3350685789215133e-07, "epoch": 2.684956986747268, "percentage": 89.53, "elapsed_time": "4:26:32", "remaining_time": "0:31:11"}
1924
+ {"current_steps": 1924, "total_steps": 2148, "loss": 0.2453, "lr": 3.3059489061866625e-07, "epoch": 2.6863520111601953, "percentage": 89.57, "elapsed_time": "4:26:40", "remaining_time": "0:31:02"}
1925
+ {"current_steps": 1925, "total_steps": 2148, "loss": 0.2521, "lr": 3.276952571620556e-07, "epoch": 2.6877470355731226, "percentage": 89.62, "elapsed_time": "4:26:52", "remaining_time": "0:30:54"}
1926
+ {"current_steps": 1926, "total_steps": 2148, "loss": 0.231, "lr": 3.248079651814395e-07, "epoch": 2.68914205998605, "percentage": 89.66, "elapsed_time": "4:26:59", "remaining_time": "0:30:46"}
1927
+ {"current_steps": 1927, "total_steps": 2148, "loss": 0.196, "lr": 3.2193302230334455e-07, "epoch": 2.690537084398977, "percentage": 89.71, "elapsed_time": "4:27:06", "remaining_time": "0:30:37"}
1928
+ {"current_steps": 1928, "total_steps": 2148, "loss": 0.2119, "lr": 3.190704361216751e-07, "epoch": 2.6919321088119044, "percentage": 89.76, "elapsed_time": "4:27:12", "remaining_time": "0:30:29"}
1929
+ {"current_steps": 1929, "total_steps": 2148, "loss": 0.2647, "lr": 3.162202141976956e-07, "epoch": 2.693327133224831, "percentage": 89.8, "elapsed_time": "4:27:20", "remaining_time": "0:30:21"}
1930
+ {"current_steps": 1930, "total_steps": 2148, "loss": 0.2589, "lr": 3.133823640600137e-07, "epoch": 2.6947221576377585, "percentage": 89.85, "elapsed_time": "4:27:28", "remaining_time": "0:30:12"}
1931
+ {"current_steps": 1931, "total_steps": 2148, "loss": 0.2499, "lr": 3.105568932045577e-07, "epoch": 2.6961171820506857, "percentage": 89.9, "elapsed_time": "4:27:35", "remaining_time": "0:30:04"}
1932
+ {"current_steps": 1932, "total_steps": 2148, "loss": 0.2188, "lr": 3.077438090945573e-07, "epoch": 2.697512206463613, "percentage": 89.94, "elapsed_time": "4:27:42", "remaining_time": "0:29:55"}
1933
+ {"current_steps": 1933, "total_steps": 2148, "loss": 0.2464, "lr": 3.0494311916052234e-07, "epoch": 2.6989072308765403, "percentage": 89.99, "elapsed_time": "4:27:49", "remaining_time": "0:29:47"}
1934
+ {"current_steps": 1934, "total_steps": 2148, "loss": 0.2486, "lr": 3.021548308002248e-07, "epoch": 2.7003022552894675, "percentage": 90.04, "elapsed_time": "4:28:00", "remaining_time": "0:29:39"}
1935
+ {"current_steps": 1935, "total_steps": 2148, "loss": 0.2329, "lr": 2.9937895137868046e-07, "epoch": 2.701697279702395, "percentage": 90.08, "elapsed_time": "4:28:07", "remaining_time": "0:29:30"}
1936
+ {"current_steps": 1936, "total_steps": 2148, "loss": 0.2162, "lr": 2.9661548822812636e-07, "epoch": 2.703092304115322, "percentage": 90.13, "elapsed_time": "4:28:15", "remaining_time": "0:29:22"}
1937
+ {"current_steps": 1937, "total_steps": 2148, "loss": 0.2554, "lr": 2.9386444864800355e-07, "epoch": 2.7044873285282494, "percentage": 90.18, "elapsed_time": "4:28:22", "remaining_time": "0:29:14"}
1938
+ {"current_steps": 1938, "total_steps": 2148, "loss": 0.2677, "lr": 2.911258399049394e-07, "epoch": 2.7058823529411766, "percentage": 90.22, "elapsed_time": "4:28:31", "remaining_time": "0:29:05"}
1939
+ {"current_steps": 1939, "total_steps": 2148, "loss": 0.2281, "lr": 2.8839966923272286e-07, "epoch": 2.707277377354104, "percentage": 90.27, "elapsed_time": "4:28:38", "remaining_time": "0:28:57"}
1940
+ {"current_steps": 1940, "total_steps": 2148, "loss": 0.2527, "lr": 2.8568594383229067e-07, "epoch": 2.708672401767031, "percentage": 90.32, "elapsed_time": "4:28:46", "remaining_time": "0:28:49"}
1941
+ {"current_steps": 1941, "total_steps": 2148, "loss": 0.2567, "lr": 2.8298467087170655e-07, "epoch": 2.710067426179958, "percentage": 90.36, "elapsed_time": "4:28:53", "remaining_time": "0:28:40"}
1942
+ {"current_steps": 1942, "total_steps": 2148, "loss": 0.2419, "lr": 2.8029585748614196e-07, "epoch": 2.7114624505928853, "percentage": 90.41, "elapsed_time": "4:28:59", "remaining_time": "0:28:32"}
1943
+ {"current_steps": 1943, "total_steps": 2148, "loss": 0.2418, "lr": 2.7761951077785676e-07, "epoch": 2.7128574750058125, "percentage": 90.46, "elapsed_time": "4:29:06", "remaining_time": "0:28:23"}
1944
+ {"current_steps": 1944, "total_steps": 2148, "loss": 0.2247, "lr": 2.749556378161833e-07, "epoch": 2.71425249941874, "percentage": 90.5, "elapsed_time": "4:29:19", "remaining_time": "0:28:15"}
1945
+ {"current_steps": 1945, "total_steps": 2148, "loss": 0.2214, "lr": 2.723042456375036e-07, "epoch": 2.715647523831667, "percentage": 90.55, "elapsed_time": "4:29:25", "remaining_time": "0:28:07"}
1946
+ {"current_steps": 1946, "total_steps": 2148, "loss": 0.2254, "lr": 2.696653412452327e-07, "epoch": 2.7170425482445943, "percentage": 90.6, "elapsed_time": "4:29:32", "remaining_time": "0:27:58"}
1947
+ {"current_steps": 1947, "total_steps": 2148, "loss": 0.2315, "lr": 2.6703893160980266e-07, "epoch": 2.7184375726575216, "percentage": 90.64, "elapsed_time": "4:29:39", "remaining_time": "0:27:50"}
1948
+ {"current_steps": 1948, "total_steps": 2148, "loss": 0.2433, "lr": 2.6442502366863854e-07, "epoch": 2.719832597070449, "percentage": 90.69, "elapsed_time": "4:29:45", "remaining_time": "0:27:41"}
1949
+ {"current_steps": 1949, "total_steps": 2148, "loss": 0.2334, "lr": 2.618236243261452e-07, "epoch": 2.7212276214833757, "percentage": 90.74, "elapsed_time": "4:29:52", "remaining_time": "0:27:33"}
1950
+ {"current_steps": 1950, "total_steps": 2148, "loss": 0.2349, "lr": 2.592347404536888e-07, "epoch": 2.722622645896303, "percentage": 90.78, "elapsed_time": "4:29:58", "remaining_time": "0:27:24"}
1951
+ {"current_steps": 1951, "total_steps": 2148, "loss": 0.2348, "lr": 2.566583788895721e-07, "epoch": 2.7240176703092303, "percentage": 90.83, "elapsed_time": "4:30:05", "remaining_time": "0:27:16"}
1952
+ {"current_steps": 1952, "total_steps": 2148, "loss": 0.2381, "lr": 2.5409454643902543e-07, "epoch": 2.7254126947221575, "percentage": 90.88, "elapsed_time": "4:30:11", "remaining_time": "0:27:07"}
1953
+ {"current_steps": 1953, "total_steps": 2148, "loss": 0.2414, "lr": 2.5154324987418434e-07, "epoch": 2.726807719135085, "percentage": 90.92, "elapsed_time": "4:30:18", "remaining_time": "0:26:59"}
1954
+ {"current_steps": 1954, "total_steps": 2148, "loss": 0.2245, "lr": 2.4900449593406984e-07, "epoch": 2.728202743548012, "percentage": 90.97, "elapsed_time": "4:30:24", "remaining_time": "0:26:50"}
1955
+ {"current_steps": 1955, "total_steps": 2148, "loss": 0.2259, "lr": 2.4647829132457446e-07, "epoch": 2.7295977679609393, "percentage": 91.01, "elapsed_time": "4:30:34", "remaining_time": "0:26:42"}
1956
+ {"current_steps": 1956, "total_steps": 2148, "loss": 0.2207, "lr": 2.439646427184428e-07, "epoch": 2.7309927923738666, "percentage": 91.06, "elapsed_time": "4:30:45", "remaining_time": "0:26:34"}
1957
+ {"current_steps": 1957, "total_steps": 2148, "loss": 0.2292, "lr": 2.4146355675525145e-07, "epoch": 2.732387816786794, "percentage": 91.11, "elapsed_time": "4:30:53", "remaining_time": "0:26:26"}
1958
+ {"current_steps": 1958, "total_steps": 2148, "loss": 0.2481, "lr": 2.389750400413965e-07, "epoch": 2.733782841199721, "percentage": 91.15, "elapsed_time": "4:31:02", "remaining_time": "0:26:18"}
1959
+ {"current_steps": 1959, "total_steps": 2148, "loss": 0.2264, "lr": 2.364990991500743e-07, "epoch": 2.7351778656126484, "percentage": 91.2, "elapsed_time": "4:31:11", "remaining_time": "0:26:09"}
1960
+ {"current_steps": 1960, "total_steps": 2148, "loss": 0.2055, "lr": 2.340357406212601e-07, "epoch": 2.7365728900255757, "percentage": 91.25, "elapsed_time": "4:31:17", "remaining_time": "0:26:01"}
1961
+ {"current_steps": 1961, "total_steps": 2148, "loss": 0.1983, "lr": 2.315849709616963e-07, "epoch": 2.7379679144385025, "percentage": 91.29, "elapsed_time": "4:31:24", "remaining_time": "0:25:52"}
1962
+ {"current_steps": 1962, "total_steps": 2148, "loss": 0.1951, "lr": 2.2914679664487237e-07, "epoch": 2.73936293885143, "percentage": 91.34, "elapsed_time": "4:31:31", "remaining_time": "0:25:44"}
1963
+ {"current_steps": 1963, "total_steps": 2148, "loss": 0.2368, "lr": 2.2672122411100727e-07, "epoch": 2.740757963264357, "percentage": 91.39, "elapsed_time": "4:31:38", "remaining_time": "0:25:36"}
1964
+ {"current_steps": 1964, "total_steps": 2148, "loss": 0.221, "lr": 2.2430825976703485e-07, "epoch": 2.7421529876772843, "percentage": 91.43, "elapsed_time": "4:31:50", "remaining_time": "0:25:28"}
1965
+ {"current_steps": 1965, "total_steps": 2148, "loss": 0.2667, "lr": 2.2190790998658561e-07, "epoch": 2.7435480120902116, "percentage": 91.48, "elapsed_time": "4:31:56", "remaining_time": "0:25:19"}
1966
+ {"current_steps": 1966, "total_steps": 2148, "loss": 0.2194, "lr": 2.1952018110996843e-07, "epoch": 2.744943036503139, "percentage": 91.53, "elapsed_time": "4:32:03", "remaining_time": "0:25:11"}
1967
+ {"current_steps": 1967, "total_steps": 2148, "loss": 0.2541, "lr": 2.1714507944415708e-07, "epoch": 2.746338060916066, "percentage": 91.57, "elapsed_time": "4:32:13", "remaining_time": "0:25:03"}
1968
+ {"current_steps": 1968, "total_steps": 2148, "loss": 0.2181, "lr": 2.1478261126276989e-07, "epoch": 2.7477330853289934, "percentage": 91.62, "elapsed_time": "4:32:26", "remaining_time": "0:24:55"}
1969
+ {"current_steps": 1969, "total_steps": 2148, "loss": 0.2414, "lr": 2.1243278280605517e-07, "epoch": 2.7491281097419202, "percentage": 91.67, "elapsed_time": "4:32:36", "remaining_time": "0:24:46"}
1970
+ {"current_steps": 1970, "total_steps": 2148, "loss": 0.2198, "lr": 2.1009560028087627e-07, "epoch": 2.7505231341548475, "percentage": 91.71, "elapsed_time": "4:32:46", "remaining_time": "0:24:38"}
1971
+ {"current_steps": 1971, "total_steps": 2148, "loss": 0.2335, "lr": 2.0777106986069162e-07, "epoch": 2.7519181585677748, "percentage": 91.76, "elapsed_time": "4:32:55", "remaining_time": "0:24:30"}
1972
+ {"current_steps": 1972, "total_steps": 2148, "loss": 0.2151, "lr": 2.0545919768554078e-07, "epoch": 2.753313182980702, "percentage": 91.81, "elapsed_time": "4:33:03", "remaining_time": "0:24:22"}
1973
+ {"current_steps": 1973, "total_steps": 2148, "loss": 0.2484, "lr": 2.0315998986202902e-07, "epoch": 2.7547082073936293, "percentage": 91.85, "elapsed_time": "4:33:11", "remaining_time": "0:24:13"}
1974
+ {"current_steps": 1974, "total_steps": 2148, "loss": 0.229, "lr": 2.0087345246330714e-07, "epoch": 2.7561032318065566, "percentage": 91.9, "elapsed_time": "4:33:18", "remaining_time": "0:24:05"}
1975
+ {"current_steps": 1975, "total_steps": 2148, "loss": 0.2346, "lr": 1.985995915290595e-07, "epoch": 2.757498256219484, "percentage": 91.95, "elapsed_time": "4:33:25", "remaining_time": "0:23:57"}
1976
+ {"current_steps": 1976, "total_steps": 2148, "loss": 0.213, "lr": 1.9633841306548717e-07, "epoch": 2.758893280632411, "percentage": 91.99, "elapsed_time": "4:33:34", "remaining_time": "0:23:48"}
1977
+ {"current_steps": 1977, "total_steps": 2148, "loss": 0.2505, "lr": 1.9408992304529252e-07, "epoch": 2.7602883050453384, "percentage": 92.04, "elapsed_time": "4:33:50", "remaining_time": "0:23:41"}
1978
+ {"current_steps": 1978, "total_steps": 2148, "loss": 0.1984, "lr": 1.9185412740765962e-07, "epoch": 2.7616833294582657, "percentage": 92.09, "elapsed_time": "4:34:00", "remaining_time": "0:23:33"}
1979
+ {"current_steps": 1979, "total_steps": 2148, "loss": 0.2222, "lr": 1.8963103205824397e-07, "epoch": 2.763078353871193, "percentage": 92.13, "elapsed_time": "4:34:07", "remaining_time": "0:23:24"}
1980
+ {"current_steps": 1980, "total_steps": 2148, "loss": 0.233, "lr": 1.8742064286915329e-07, "epoch": 2.76447337828412, "percentage": 92.18, "elapsed_time": "4:34:14", "remaining_time": "0:23:16"}
1981
+ {"current_steps": 1981, "total_steps": 2148, "loss": 0.25, "lr": 1.8522296567893282e-07, "epoch": 2.765868402697047, "percentage": 92.23, "elapsed_time": "4:34:22", "remaining_time": "0:23:07"}
1982
+ {"current_steps": 1982, "total_steps": 2148, "loss": 0.223, "lr": 1.830380062925513e-07, "epoch": 2.7672634271099743, "percentage": 92.27, "elapsed_time": "4:34:28", "remaining_time": "0:22:59"}
1983
+ {"current_steps": 1983, "total_steps": 2148, "loss": 0.2372, "lr": 1.8086577048138432e-07, "epoch": 2.7686584515229016, "percentage": 92.32, "elapsed_time": "4:34:34", "remaining_time": "0:22:50"}
1984
+ {"current_steps": 1984, "total_steps": 2148, "loss": 0.2201, "lr": 1.787062639831988e-07, "epoch": 2.770053475935829, "percentage": 92.36, "elapsed_time": "4:34:41", "remaining_time": "0:22:42"}
1985
+ {"current_steps": 1985, "total_steps": 2148, "loss": 0.2152, "lr": 1.7655949250213743e-07, "epoch": 2.771448500348756, "percentage": 92.41, "elapsed_time": "4:34:49", "remaining_time": "0:22:34"}
1986
+ {"current_steps": 1986, "total_steps": 2148, "loss": 0.2247, "lr": 1.7442546170870654e-07, "epoch": 2.7728435247616834, "percentage": 92.46, "elapsed_time": "4:34:56", "remaining_time": "0:22:25"}
1987
+ {"current_steps": 1987, "total_steps": 2148, "loss": 0.2408, "lr": 1.7230417723975766e-07, "epoch": 2.7742385491746107, "percentage": 92.5, "elapsed_time": "4:35:06", "remaining_time": "0:22:17"}
1988
+ {"current_steps": 1988, "total_steps": 2148, "loss": 0.2128, "lr": 1.7019564469847372e-07, "epoch": 2.775633573587538, "percentage": 92.55, "elapsed_time": "4:35:16", "remaining_time": "0:22:09"}
1989
+ {"current_steps": 1989, "total_steps": 2148, "loss": 0.205, "lr": 1.6809986965435675e-07, "epoch": 2.7770285980004648, "percentage": 92.6, "elapsed_time": "4:35:23", "remaining_time": "0:22:00"}
1990
+ {"current_steps": 1990, "total_steps": 2148, "loss": 0.2432, "lr": 1.660168576432092e-07, "epoch": 2.778423622413392, "percentage": 92.64, "elapsed_time": "4:35:34", "remaining_time": "0:21:52"}
1991
+ {"current_steps": 1991, "total_steps": 2148, "loss": 0.2215, "lr": 1.6394661416711977e-07, "epoch": 2.7798186468263193, "percentage": 92.69, "elapsed_time": "4:35:44", "remaining_time": "0:21:44"}
1992
+ {"current_steps": 1992, "total_steps": 2148, "loss": 0.2231, "lr": 1.6188914469445372e-07, "epoch": 2.7812136712392466, "percentage": 92.74, "elapsed_time": "4:35:52", "remaining_time": "0:21:36"}
1993
+ {"current_steps": 1993, "total_steps": 2148, "loss": 0.2332, "lr": 1.5984445465983156e-07, "epoch": 2.782608695652174, "percentage": 92.78, "elapsed_time": "4:36:00", "remaining_time": "0:21:27"}
1994
+ {"current_steps": 1994, "total_steps": 2148, "loss": 0.2169, "lr": 1.5781254946412029e-07, "epoch": 2.784003720065101, "percentage": 92.83, "elapsed_time": "4:36:07", "remaining_time": "0:21:19"}
1995
+ {"current_steps": 1995, "total_steps": 2148, "loss": 0.2156, "lr": 1.5579343447441663e-07, "epoch": 2.7853987444780284, "percentage": 92.88, "elapsed_time": "4:36:18", "remaining_time": "0:21:11"}
1996
+ {"current_steps": 1996, "total_steps": 2148, "loss": 0.1899, "lr": 1.5378711502403164e-07, "epoch": 2.7867937688909556, "percentage": 92.92, "elapsed_time": "4:36:25", "remaining_time": "0:21:02"}
1997
+ {"current_steps": 1997, "total_steps": 2148, "loss": 0.2378, "lr": 1.5179359641247948e-07, "epoch": 2.788188793303883, "percentage": 92.97, "elapsed_time": "4:36:32", "remaining_time": "0:20:54"}
1998
+ {"current_steps": 1998, "total_steps": 2148, "loss": 0.2406, "lr": 1.4981288390546188e-07, "epoch": 2.78958381771681, "percentage": 93.02, "elapsed_time": "4:36:39", "remaining_time": "0:20:46"}
1999
+ {"current_steps": 1999, "total_steps": 2148, "loss": 0.2271, "lr": 1.4784498273485436e-07, "epoch": 2.7909788421297375, "percentage": 93.06, "elapsed_time": "4:36:49", "remaining_time": "0:20:38"}
2000
+ {"current_steps": 2000, "total_steps": 2148, "loss": 0.2356, "lr": 1.458898980986917e-07, "epoch": 2.7923738665426647, "percentage": 93.11, "elapsed_time": "4:37:00", "remaining_time": "0:20:29"}
2001
+ {"current_steps": 2001, "total_steps": 2148, "loss": 0.2287, "lr": 1.4394763516115573e-07, "epoch": 2.793768890955592, "percentage": 93.16, "elapsed_time": "4:38:58", "remaining_time": "0:20:29"}
2002
+ {"current_steps": 2002, "total_steps": 2148, "loss": 0.2258, "lr": 1.4201819905256043e-07, "epoch": 2.795163915368519, "percentage": 93.2, "elapsed_time": "4:39:07", "remaining_time": "0:20:21"}
2003
+ {"current_steps": 2003, "total_steps": 2148, "loss": 0.2514, "lr": 1.4010159486933906e-07, "epoch": 2.796558939781446, "percentage": 93.25, "elapsed_time": "4:39:15", "remaining_time": "0:20:12"}
2004
+ {"current_steps": 2004, "total_steps": 2148, "loss": 0.2193, "lr": 1.3819782767403034e-07, "epoch": 2.7979539641943734, "percentage": 93.3, "elapsed_time": "4:39:23", "remaining_time": "0:20:04"}
2005
+ {"current_steps": 2005, "total_steps": 2148, "loss": 0.2356, "lr": 1.363069024952668e-07, "epoch": 2.7993489886073006, "percentage": 93.34, "elapsed_time": "4:39:30", "remaining_time": "0:19:56"}
2006
+ {"current_steps": 2006, "total_steps": 2148, "loss": 0.245, "lr": 1.344288243277575e-07, "epoch": 2.800744013020228, "percentage": 93.39, "elapsed_time": "4:39:38", "remaining_time": "0:19:47"}
2007
+ {"current_steps": 2007, "total_steps": 2148, "loss": 0.2242, "lr": 1.3256359813227758e-07, "epoch": 2.802139037433155, "percentage": 93.44, "elapsed_time": "4:39:47", "remaining_time": "0:19:39"}
2008
+ {"current_steps": 2008, "total_steps": 2148, "loss": 0.246, "lr": 1.3071122883565657e-07, "epoch": 2.8035340618460824, "percentage": 93.48, "elapsed_time": "4:39:54", "remaining_time": "0:19:30"}
2009
+ {"current_steps": 2009, "total_steps": 2148, "loss": 0.2448, "lr": 1.288717213307622e-07, "epoch": 2.8049290862590093, "percentage": 93.53, "elapsed_time": "4:40:02", "remaining_time": "0:19:22"}
2010
+ {"current_steps": 2010, "total_steps": 2148, "loss": 0.2524, "lr": 1.2704508047649e-07, "epoch": 2.8063241106719365, "percentage": 93.58, "elapsed_time": "4:40:08", "remaining_time": "0:19:14"}
2011
+ {"current_steps": 2011, "total_steps": 2148, "loss": 0.2007, "lr": 1.2523131109774822e-07, "epoch": 2.807719135084864, "percentage": 93.62, "elapsed_time": "4:40:19", "remaining_time": "0:19:05"}
2012
+ {"current_steps": 2012, "total_steps": 2148, "loss": 0.2162, "lr": 1.234304179854473e-07, "epoch": 2.809114159497791, "percentage": 93.67, "elapsed_time": "4:40:28", "remaining_time": "0:18:57"}
2013
+ {"current_steps": 2013, "total_steps": 2148, "loss": 0.2266, "lr": 1.2164240589648436e-07, "epoch": 2.8105091839107184, "percentage": 93.72, "elapsed_time": "4:40:40", "remaining_time": "0:18:49"}
2014
+ {"current_steps": 2014, "total_steps": 2148, "loss": 0.2281, "lr": 1.1986727955373588e-07, "epoch": 2.8119042083236456, "percentage": 93.76, "elapsed_time": "4:40:52", "remaining_time": "0:18:41"}
2015
+ {"current_steps": 2015, "total_steps": 2148, "loss": 0.24, "lr": 1.1810504364603737e-07, "epoch": 2.813299232736573, "percentage": 93.81, "elapsed_time": "4:41:00", "remaining_time": "0:18:32"}
2016
+ {"current_steps": 2016, "total_steps": 2148, "loss": 0.2058, "lr": 1.163557028281792e-07, "epoch": 2.8146942571495, "percentage": 93.85, "elapsed_time": "4:41:07", "remaining_time": "0:18:24"}
2017
+ {"current_steps": 2017, "total_steps": 2148, "loss": 0.1974, "lr": 1.146192617208891e-07, "epoch": 2.8160892815624274, "percentage": 93.9, "elapsed_time": "4:41:20", "remaining_time": "0:18:16"}
2018
+ {"current_steps": 2018, "total_steps": 2148, "loss": 0.2076, "lr": 1.128957249108209e-07, "epoch": 2.8174843059753547, "percentage": 93.95, "elapsed_time": "4:41:28", "remaining_time": "0:18:07"}
2019
+ {"current_steps": 2019, "total_steps": 2148, "loss": 0.2085, "lr": 1.1118509695054236e-07, "epoch": 2.818879330388282, "percentage": 93.99, "elapsed_time": "4:41:35", "remaining_time": "0:17:59"}
2020
+ {"current_steps": 2020, "total_steps": 2148, "loss": 0.2078, "lr": 1.094873823585263e-07, "epoch": 2.8202743548012092, "percentage": 94.04, "elapsed_time": "4:41:43", "remaining_time": "0:17:51"}
2021
+ {"current_steps": 2021, "total_steps": 2148, "loss": 0.2367, "lr": 1.0780258561913281e-07, "epoch": 2.8216693792141365, "percentage": 94.09, "elapsed_time": "4:41:51", "remaining_time": "0:17:42"}
2022
+ {"current_steps": 2022, "total_steps": 2148, "loss": 0.2332, "lr": 1.0613071118260321e-07, "epoch": 2.8230644036270633, "percentage": 94.13, "elapsed_time": "4:41:58", "remaining_time": "0:17:34"}
2023
+ {"current_steps": 2023, "total_steps": 2148, "loss": 0.2497, "lr": 1.0447176346504439e-07, "epoch": 2.8244594280399906, "percentage": 94.18, "elapsed_time": "4:42:09", "remaining_time": "0:17:26"}
2024
+ {"current_steps": 2024, "total_steps": 2148, "loss": 0.2507, "lr": 1.0282574684841784e-07, "epoch": 2.825854452452918, "percentage": 94.23, "elapsed_time": "4:42:16", "remaining_time": "0:17:17"}
2025
+ {"current_steps": 2025, "total_steps": 2148, "loss": 0.213, "lr": 1.011926656805301e-07, "epoch": 2.827249476865845, "percentage": 94.27, "elapsed_time": "4:42:31", "remaining_time": "0:17:09"}
2026
+ {"current_steps": 2026, "total_steps": 2148, "loss": 0.2115, "lr": 9.957252427501951e-08, "epoch": 2.8286445012787724, "percentage": 94.32, "elapsed_time": "4:42:39", "remaining_time": "0:17:01"}
2027
+ {"current_steps": 2027, "total_steps": 2148, "loss": 0.2388, "lr": 9.796532691134453e-08, "epoch": 2.8300395256916997, "percentage": 94.37, "elapsed_time": "4:42:49", "remaining_time": "0:16:52"}
2028
+ {"current_steps": 2028, "total_steps": 2148, "loss": 0.2171, "lr": 9.637107783477484e-08, "epoch": 2.831434550104627, "percentage": 94.41, "elapsed_time": "4:42:56", "remaining_time": "0:16:44"}
2029
+ {"current_steps": 2029, "total_steps": 2148, "loss": 0.2061, "lr": 9.478978125637583e-08, "epoch": 2.832829574517554, "percentage": 94.46, "elapsed_time": "4:43:07", "remaining_time": "0:16:36"}
2030
+ {"current_steps": 2030, "total_steps": 2148, "loss": 0.2329, "lr": 9.322144135300137e-08, "epoch": 2.834224598930481, "percentage": 94.51, "elapsed_time": "4:43:17", "remaining_time": "0:16:28"}
2031
+ {"current_steps": 2031, "total_steps": 2148, "loss": 0.2074, "lr": 9.166606226728103e-08, "epoch": 2.8356196233434083, "percentage": 94.55, "elapsed_time": "4:43:24", "remaining_time": "0:16:19"}
2032
+ {"current_steps": 2032, "total_steps": 2148, "loss": 0.2384, "lr": 9.012364810761121e-08, "epoch": 2.8370146477563356, "percentage": 94.6, "elapsed_time": "4:43:32", "remaining_time": "0:16:11"}
2033
+ {"current_steps": 2033, "total_steps": 2148, "loss": 0.2352, "lr": 8.859420294814014e-08, "epoch": 2.838409672169263, "percentage": 94.65, "elapsed_time": "4:43:42", "remaining_time": "0:16:02"}
2034
+ {"current_steps": 2034, "total_steps": 2148, "loss": 0.253, "lr": 8.70777308287618e-08, "epoch": 2.83980469658219, "percentage": 94.69, "elapsed_time": "4:43:49", "remaining_time": "0:15:54"}
2035
+ {"current_steps": 2035, "total_steps": 2148, "loss": 0.2535, "lr": 8.557423575510037e-08, "epoch": 2.8411997209951174, "percentage": 94.74, "elapsed_time": "4:43:58", "remaining_time": "0:15:46"}
2036
+ {"current_steps": 2036, "total_steps": 2148, "loss": 0.2498, "lr": 8.408372169850521e-08, "epoch": 2.8425947454080447, "percentage": 94.79, "elapsed_time": "4:44:12", "remaining_time": "0:15:38"}
2037
+ {"current_steps": 2037, "total_steps": 2148, "loss": 0.2648, "lr": 8.26061925960353e-08, "epoch": 2.843989769820972, "percentage": 94.83, "elapsed_time": "4:44:24", "remaining_time": "0:15:29"}
2038
+ {"current_steps": 2038, "total_steps": 2148, "loss": 0.2425, "lr": 8.114165235045268e-08, "epoch": 2.8453847942338992, "percentage": 94.88, "elapsed_time": "4:44:31", "remaining_time": "0:15:21"}
2039
+ {"current_steps": 2039, "total_steps": 2148, "loss": 0.2298, "lr": 7.969010483020845e-08, "epoch": 2.8467798186468265, "percentage": 94.93, "elapsed_time": "4:44:38", "remaining_time": "0:15:12"}
2040
+ {"current_steps": 2040, "total_steps": 2148, "loss": 0.2355, "lr": 7.825155386943784e-08, "epoch": 2.8481748430597538, "percentage": 94.97, "elapsed_time": "4:44:46", "remaining_time": "0:15:04"}
2041
+ {"current_steps": 2041, "total_steps": 2148, "loss": 0.2419, "lr": 7.682600326794353e-08, "epoch": 2.849569867472681, "percentage": 95.02, "elapsed_time": "4:44:58", "remaining_time": "0:14:56"}
2042
+ {"current_steps": 2042, "total_steps": 2148, "loss": 0.2325, "lr": 7.541345679118961e-08, "epoch": 2.850964891885608, "percentage": 95.07, "elapsed_time": "4:45:07", "remaining_time": "0:14:48"}
2043
+ {"current_steps": 2043, "total_steps": 2148, "loss": 0.2259, "lr": 7.401391817029257e-08, "epoch": 2.852359916298535, "percentage": 95.11, "elapsed_time": "4:45:15", "remaining_time": "0:14:39"}
2044
+ {"current_steps": 2044, "total_steps": 2148, "loss": 0.2272, "lr": 7.262739110200923e-08, "epoch": 2.8537549407114624, "percentage": 95.16, "elapsed_time": "4:45:21", "remaining_time": "0:14:31"}
2045
+ {"current_steps": 2045, "total_steps": 2148, "loss": 0.2544, "lr": 7.125387924872552e-08, "epoch": 2.8551499651243897, "percentage": 95.2, "elapsed_time": "4:45:31", "remaining_time": "0:14:22"}
2046
+ {"current_steps": 2046, "total_steps": 2148, "loss": 0.2132, "lr": 6.98933862384521e-08, "epoch": 2.856544989537317, "percentage": 95.25, "elapsed_time": "4:45:38", "remaining_time": "0:14:14"}