yuzhounie commited on
Commit
c18daa8
·
verified ·
1 Parent(s): 61f03d1

Training in progress, step 2000

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9be3b6a41b0ce05d80d6903f549e820472e0b908599e49b8dab71d6fee82275e
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:728c295871c494d5d0b555809c03f36dcba106eaa33e6137026884eac0bfeaf8
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ce7c5ce0a2ea4c63c9a193414ee30f823d96c672e74ec475533255fef55cd2f4
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6d66d467f2e7d263f57ccdb3228259f9924b289575064881dffdf8d69a2da1f
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:464de9af4b49a93b5aaedc9e30151b924ff14812684c6c8bbd71fecb534fa141
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d63f46e90a48121a44eb6cf9e10cd798565607f016b2c21ae3e932b4feb6b666
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:73a708e88799b98c4c296d3a3c1cf1ed10d0cdbd940d62fa6203bf1d549cc3fc
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6716c227c90308816e0af32cf5e1ef23f5b826876ef0ddc6f0d86d18febdedbf
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -1613,3 +1613,404 @@
1613
  {"current_steps": 1613, "total_steps": 2148, "loss": 0.2215, "lr": 1.7801865376915451e-06, "epoch": 2.252499418739828, "percentage": 75.09, "elapsed_time": "3:45:42", "remaining_time": "1:14:51"}
1614
  {"current_steps": 1614, "total_steps": 2148, "loss": 0.2469, "lr": 1.7739737801346895e-06, "epoch": 2.2538944431527552, "percentage": 75.14, "elapsed_time": "3:45:49", "remaining_time": "1:14:42"}
1615
  {"current_steps": 1615, "total_steps": 2148, "loss": 0.2573, "lr": 1.7677695438381831e-06, "epoch": 2.2552894675656825, "percentage": 75.19, "elapsed_time": "3:45:57", "remaining_time": "1:14:34"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1613
  {"current_steps": 1613, "total_steps": 2148, "loss": 0.2215, "lr": 1.7801865376915451e-06, "epoch": 2.252499418739828, "percentage": 75.09, "elapsed_time": "3:45:42", "remaining_time": "1:14:51"}
1614
  {"current_steps": 1614, "total_steps": 2148, "loss": 0.2469, "lr": 1.7739737801346895e-06, "epoch": 2.2538944431527552, "percentage": 75.14, "elapsed_time": "3:45:49", "remaining_time": "1:14:42"}
1615
  {"current_steps": 1615, "total_steps": 2148, "loss": 0.2573, "lr": 1.7677695438381831e-06, "epoch": 2.2552894675656825, "percentage": 75.19, "elapsed_time": "3:45:57", "remaining_time": "1:14:34"}
1616
+ {"current_steps": 1616, "total_steps": 2148, "loss": 0.2367, "lr": 1.761573845189965e-06, "epoch": 2.2566844919786098, "percentage": 75.23, "elapsed_time": "3:46:05", "remaining_time": "1:14:25"}
1617
+ {"current_steps": 1617, "total_steps": 2148, "loss": 0.2068, "lr": 1.7553867005554215e-06, "epoch": 2.258079516391537, "percentage": 75.28, "elapsed_time": "3:46:13", "remaining_time": "1:14:17"}
1618
+ {"current_steps": 1618, "total_steps": 2148, "loss": 0.2304, "lr": 1.7492081262773397e-06, "epoch": 2.2594745408044643, "percentage": 75.33, "elapsed_time": "3:46:19", "remaining_time": "1:14:08"}
1619
+ {"current_steps": 1619, "total_steps": 2148, "loss": 0.2447, "lr": 1.7430381386758748e-06, "epoch": 2.260869565217391, "percentage": 75.37, "elapsed_time": "3:46:28", "remaining_time": "1:13:59"}
1620
+ {"current_steps": 1620, "total_steps": 2148, "loss": 0.2228, "lr": 1.7368767540484965e-06, "epoch": 2.2622645896303184, "percentage": 75.42, "elapsed_time": "3:46:35", "remaining_time": "1:13:51"}
1621
+ {"current_steps": 1621, "total_steps": 2148, "loss": 0.2541, "lr": 1.7307239886699546e-06, "epoch": 2.2636596140432457, "percentage": 75.47, "elapsed_time": "3:46:42", "remaining_time": "1:13:42"}
1622
+ {"current_steps": 1622, "total_steps": 2148, "loss": 0.2414, "lr": 1.7245798587922263e-06, "epoch": 2.265054638456173, "percentage": 75.51, "elapsed_time": "3:46:48", "remaining_time": "1:13:33"}
1623
+ {"current_steps": 1623, "total_steps": 2148, "loss": 0.2221, "lr": 1.7184443806444851e-06, "epoch": 2.2664496628691, "percentage": 75.56, "elapsed_time": "3:46:58", "remaining_time": "1:13:25"}
1624
+ {"current_steps": 1624, "total_steps": 2148, "loss": 0.2194, "lr": 1.7123175704330514e-06, "epoch": 2.2678446872820275, "percentage": 75.61, "elapsed_time": "3:47:06", "remaining_time": "1:13:16"}
1625
+ {"current_steps": 1625, "total_steps": 2148, "loss": 0.2393, "lr": 1.706199444341341e-06, "epoch": 2.2692397116949548, "percentage": 75.65, "elapsed_time": "3:47:15", "remaining_time": "1:13:08"}
1626
+ {"current_steps": 1626, "total_steps": 2148, "loss": 0.2729, "lr": 1.7000900185298418e-06, "epoch": 2.270634736107882, "percentage": 75.7, "elapsed_time": "3:47:21", "remaining_time": "1:12:59"}
1627
+ {"current_steps": 1627, "total_steps": 2148, "loss": 0.2609, "lr": 1.6939893091360577e-06, "epoch": 2.2720297605208093, "percentage": 75.74, "elapsed_time": "3:47:32", "remaining_time": "1:12:51"}
1628
+ {"current_steps": 1628, "total_steps": 2148, "loss": 0.2266, "lr": 1.6878973322744658e-06, "epoch": 2.273424784933736, "percentage": 75.79, "elapsed_time": "3:47:38", "remaining_time": "1:12:42"}
1629
+ {"current_steps": 1629, "total_steps": 2148, "loss": 0.2307, "lr": 1.6818141040364816e-06, "epoch": 2.2748198093466634, "percentage": 75.84, "elapsed_time": "3:47:46", "remaining_time": "1:12:34"}
1630
+ {"current_steps": 1630, "total_steps": 2148, "loss": 0.2243, "lr": 1.6757396404904087e-06, "epoch": 2.2762148337595907, "percentage": 75.88, "elapsed_time": "3:47:53", "remaining_time": "1:12:25"}
1631
+ {"current_steps": 1631, "total_steps": 2148, "loss": 0.2401, "lr": 1.6696739576813981e-06, "epoch": 2.277609858172518, "percentage": 75.93, "elapsed_time": "3:48:03", "remaining_time": "1:12:17"}
1632
+ {"current_steps": 1632, "total_steps": 2148, "loss": 0.2659, "lr": 1.6636170716314114e-06, "epoch": 2.279004882585445, "percentage": 75.98, "elapsed_time": "3:48:09", "remaining_time": "1:12:08"}
1633
+ {"current_steps": 1633, "total_steps": 2148, "loss": 0.2615, "lr": 1.657568998339175e-06, "epoch": 2.2803999069983725, "percentage": 76.02, "elapsed_time": "3:48:16", "remaining_time": "1:11:59"}
1634
+ {"current_steps": 1634, "total_steps": 2148, "loss": 0.2491, "lr": 1.6515297537801305e-06, "epoch": 2.2817949314112997, "percentage": 76.07, "elapsed_time": "3:48:22", "remaining_time": "1:11:50"}
1635
+ {"current_steps": 1635, "total_steps": 2148, "loss": 0.2178, "lr": 1.6454993539064075e-06, "epoch": 2.283189955824227, "percentage": 76.12, "elapsed_time": "3:48:30", "remaining_time": "1:11:41"}
1636
+ {"current_steps": 1636, "total_steps": 2148, "loss": 0.2665, "lr": 1.6394778146467672e-06, "epoch": 2.2845849802371543, "percentage": 76.16, "elapsed_time": "3:48:42", "remaining_time": "1:11:34"}
1637
+ {"current_steps": 1637, "total_steps": 2148, "loss": 0.2576, "lr": 1.6334651519065658e-06, "epoch": 2.2859800046500816, "percentage": 76.21, "elapsed_time": "3:48:49", "remaining_time": "1:11:25"}
1638
+ {"current_steps": 1638, "total_steps": 2148, "loss": 0.2468, "lr": 1.6274613815677176e-06, "epoch": 2.287375029063009, "percentage": 76.26, "elapsed_time": "3:48:58", "remaining_time": "1:11:17"}
1639
+ {"current_steps": 1639, "total_steps": 2148, "loss": 0.2001, "lr": 1.6214665194886474e-06, "epoch": 2.2887700534759357, "percentage": 76.3, "elapsed_time": "3:49:07", "remaining_time": "1:11:09"}
1640
+ {"current_steps": 1640, "total_steps": 2148, "loss": 0.2098, "lr": 1.6154805815042457e-06, "epoch": 2.290165077888863, "percentage": 76.35, "elapsed_time": "3:49:15", "remaining_time": "1:11:00"}
1641
+ {"current_steps": 1641, "total_steps": 2148, "loss": 0.2459, "lr": 1.6095035834258365e-06, "epoch": 2.29156010230179, "percentage": 76.4, "elapsed_time": "3:49:21", "remaining_time": "1:10:51"}
1642
+ {"current_steps": 1642, "total_steps": 2148, "loss": 0.2003, "lr": 1.6035355410411252e-06, "epoch": 2.2929551267147175, "percentage": 76.44, "elapsed_time": "3:49:28", "remaining_time": "1:10:43"}
1643
+ {"current_steps": 1643, "total_steps": 2148, "loss": 0.2358, "lr": 1.5975764701141611e-06, "epoch": 2.2943501511276447, "percentage": 76.49, "elapsed_time": "3:49:38", "remaining_time": "1:10:34"}
1644
+ {"current_steps": 1644, "total_steps": 2148, "loss": 0.2404, "lr": 1.5916263863853e-06, "epoch": 2.295745175540572, "percentage": 76.54, "elapsed_time": "3:49:48", "remaining_time": "1:10:27"}
1645
+ {"current_steps": 1645, "total_steps": 2148, "loss": 0.2669, "lr": 1.585685305571159e-06, "epoch": 2.2971401999534993, "percentage": 76.58, "elapsed_time": "3:49:57", "remaining_time": "1:10:19"}
1646
+ {"current_steps": 1646, "total_steps": 2148, "loss": 0.2259, "lr": 1.5797532433645696e-06, "epoch": 2.2985352243664265, "percentage": 76.63, "elapsed_time": "3:50:06", "remaining_time": "1:10:10"}
1647
+ {"current_steps": 1647, "total_steps": 2148, "loss": 0.2349, "lr": 1.5738302154345475e-06, "epoch": 2.299930248779354, "percentage": 76.68, "elapsed_time": "3:50:19", "remaining_time": "1:10:03"}
1648
+ {"current_steps": 1648, "total_steps": 2148, "loss": 0.2349, "lr": 1.5679162374262414e-06, "epoch": 2.3013252731922806, "percentage": 76.72, "elapsed_time": "3:50:26", "remaining_time": "1:09:54"}
1649
+ {"current_steps": 1649, "total_steps": 2148, "loss": 0.253, "lr": 1.5620113249608943e-06, "epoch": 2.302720297605208, "percentage": 76.77, "elapsed_time": "3:50:33", "remaining_time": "1:09:45"}
1650
+ {"current_steps": 1650, "total_steps": 2148, "loss": 0.2402, "lr": 1.5561154936358069e-06, "epoch": 2.304115322018135, "percentage": 76.82, "elapsed_time": "3:50:42", "remaining_time": "1:09:38"}
1651
+ {"current_steps": 1651, "total_steps": 2148, "loss": 0.2286, "lr": 1.5502287590242942e-06, "epoch": 2.3055103464310625, "percentage": 76.86, "elapsed_time": "3:50:51", "remaining_time": "1:09:29"}
1652
+ {"current_steps": 1652, "total_steps": 2148, "loss": 0.2153, "lr": 1.5443511366756375e-06, "epoch": 2.3069053708439897, "percentage": 76.91, "elapsed_time": "3:50:58", "remaining_time": "1:09:20"}
1653
+ {"current_steps": 1653, "total_steps": 2148, "loss": 0.2437, "lr": 1.53848264211505e-06, "epoch": 2.308300395256917, "percentage": 76.96, "elapsed_time": "3:51:04", "remaining_time": "1:09:11"}
1654
+ {"current_steps": 1654, "total_steps": 2148, "loss": 0.2146, "lr": 1.5326232908436405e-06, "epoch": 2.3096954196698443, "percentage": 77.0, "elapsed_time": "3:51:13", "remaining_time": "1:09:03"}
1655
+ {"current_steps": 1655, "total_steps": 2148, "loss": 0.2328, "lr": 1.526773098338359e-06, "epoch": 2.3110904440827715, "percentage": 77.05, "elapsed_time": "3:51:21", "remaining_time": "1:08:55"}
1656
+ {"current_steps": 1656, "total_steps": 2148, "loss": 0.2315, "lr": 1.5209320800519683e-06, "epoch": 2.312485468495699, "percentage": 77.09, "elapsed_time": "3:51:29", "remaining_time": "1:08:46"}
1657
+ {"current_steps": 1657, "total_steps": 2148, "loss": 0.2503, "lr": 1.515100251412998e-06, "epoch": 2.313880492908626, "percentage": 77.14, "elapsed_time": "3:51:39", "remaining_time": "1:08:38"}
1658
+ {"current_steps": 1658, "total_steps": 2148, "loss": 0.227, "lr": 1.5092776278257027e-06, "epoch": 2.3152755173215533, "percentage": 77.19, "elapsed_time": "3:51:52", "remaining_time": "1:08:31"}
1659
+ {"current_steps": 1659, "total_steps": 2148, "loss": 0.2401, "lr": 1.5034642246700203e-06, "epoch": 2.31667054173448, "percentage": 77.23, "elapsed_time": "3:52:01", "remaining_time": "1:08:23"}
1660
+ {"current_steps": 1660, "total_steps": 2148, "loss": 0.2516, "lr": 1.4976600573015398e-06, "epoch": 2.3180655661474074, "percentage": 77.28, "elapsed_time": "3:52:08", "remaining_time": "1:08:14"}
1661
+ {"current_steps": 1661, "total_steps": 2148, "loss": 0.2487, "lr": 1.4918651410514479e-06, "epoch": 2.3194605905603347, "percentage": 77.33, "elapsed_time": "3:52:17", "remaining_time": "1:08:06"}
1662
+ {"current_steps": 1662, "total_steps": 2148, "loss": 0.2185, "lr": 1.486079491226501e-06, "epoch": 2.320855614973262, "percentage": 77.37, "elapsed_time": "3:52:24", "remaining_time": "1:07:57"}
1663
+ {"current_steps": 1663, "total_steps": 2148, "loss": 0.2273, "lr": 1.4803031231089782e-06, "epoch": 2.3222506393861893, "percentage": 77.42, "elapsed_time": "3:52:34", "remaining_time": "1:07:49"}
1664
+ {"current_steps": 1664, "total_steps": 2148, "loss": 0.2257, "lr": 1.4745360519566382e-06, "epoch": 2.3236456637991165, "percentage": 77.47, "elapsed_time": "3:52:44", "remaining_time": "1:07:41"}
1665
+ {"current_steps": 1665, "total_steps": 2148, "loss": 0.2519, "lr": 1.4687782930026833e-06, "epoch": 2.325040688212044, "percentage": 77.51, "elapsed_time": "3:52:50", "remaining_time": "1:07:32"}
1666
+ {"current_steps": 1666, "total_steps": 2148, "loss": 0.2305, "lr": 1.4630298614557236e-06, "epoch": 2.326435712624971, "percentage": 77.56, "elapsed_time": "3:52:57", "remaining_time": "1:07:23"}
1667
+ {"current_steps": 1667, "total_steps": 2148, "loss": 0.2738, "lr": 1.4572907724997249e-06, "epoch": 2.3278307370378983, "percentage": 77.61, "elapsed_time": "3:53:07", "remaining_time": "1:07:15"}
1668
+ {"current_steps": 1668, "total_steps": 2148, "loss": 0.222, "lr": 1.4515610412939791e-06, "epoch": 2.329225761450825, "percentage": 77.65, "elapsed_time": "3:53:14", "remaining_time": "1:07:07"}
1669
+ {"current_steps": 1669, "total_steps": 2148, "loss": 0.2429, "lr": 1.445840682973062e-06, "epoch": 2.3306207858637524, "percentage": 77.7, "elapsed_time": "3:53:20", "remaining_time": "1:06:58"}
1670
+ {"current_steps": 1670, "total_steps": 2148, "loss": 0.2113, "lr": 1.4401297126467884e-06, "epoch": 2.3320158102766797, "percentage": 77.75, "elapsed_time": "3:53:27", "remaining_time": "1:06:49"}
1671
+ {"current_steps": 1671, "total_steps": 2148, "loss": 0.2057, "lr": 1.4344281454001751e-06, "epoch": 2.333410834689607, "percentage": 77.79, "elapsed_time": "3:53:36", "remaining_time": "1:06:41"}
1672
+ {"current_steps": 1672, "total_steps": 2148, "loss": 0.2485, "lr": 1.4287359962934055e-06, "epoch": 2.3348058591025342, "percentage": 77.84, "elapsed_time": "3:53:44", "remaining_time": "1:06:32"}
1673
+ {"current_steps": 1673, "total_steps": 2148, "loss": 0.2534, "lr": 1.4230532803617814e-06, "epoch": 2.3362008835154615, "percentage": 77.89, "elapsed_time": "3:53:55", "remaining_time": "1:06:24"}
1674
+ {"current_steps": 1674, "total_steps": 2148, "loss": 0.2418, "lr": 1.4173800126156916e-06, "epoch": 2.337595907928389, "percentage": 77.93, "elapsed_time": "3:54:02", "remaining_time": "1:06:16"}
1675
+ {"current_steps": 1675, "total_steps": 2148, "loss": 0.2237, "lr": 1.411716208040566e-06, "epoch": 2.338990932341316, "percentage": 77.98, "elapsed_time": "3:54:11", "remaining_time": "1:06:07"}
1676
+ {"current_steps": 1676, "total_steps": 2148, "loss": 0.2487, "lr": 1.4060618815968375e-06, "epoch": 2.3403859567542433, "percentage": 78.03, "elapsed_time": "3:54:19", "remaining_time": "1:05:59"}
1677
+ {"current_steps": 1677, "total_steps": 2148, "loss": 0.264, "lr": 1.4004170482199054e-06, "epoch": 2.3417809811671706, "percentage": 78.07, "elapsed_time": "3:54:28", "remaining_time": "1:05:51"}
1678
+ {"current_steps": 1678, "total_steps": 2148, "loss": 0.209, "lr": 1.3947817228200956e-06, "epoch": 2.343176005580098, "percentage": 78.12, "elapsed_time": "3:54:35", "remaining_time": "1:05:42"}
1679
+ {"current_steps": 1679, "total_steps": 2148, "loss": 0.2622, "lr": 1.3891559202826133e-06, "epoch": 2.3445710299930247, "percentage": 78.17, "elapsed_time": "3:54:43", "remaining_time": "1:05:34"}
1680
+ {"current_steps": 1680, "total_steps": 2148, "loss": 0.2378, "lr": 1.3835396554675179e-06, "epoch": 2.345966054405952, "percentage": 78.21, "elapsed_time": "3:54:51", "remaining_time": "1:05:25"}
1681
+ {"current_steps": 1681, "total_steps": 2148, "loss": 0.2608, "lr": 1.37793294320967e-06, "epoch": 2.3473610788188792, "percentage": 78.26, "elapsed_time": "3:54:59", "remaining_time": "1:05:16"}
1682
+ {"current_steps": 1682, "total_steps": 2148, "loss": 0.2163, "lr": 1.3723357983186974e-06, "epoch": 2.3487561032318065, "percentage": 78.31, "elapsed_time": "3:55:06", "remaining_time": "1:05:08"}
1683
+ {"current_steps": 1683, "total_steps": 2148, "loss": 0.2248, "lr": 1.3667482355789607e-06, "epoch": 2.3501511276447338, "percentage": 78.35, "elapsed_time": "3:55:13", "remaining_time": "1:04:59"}
1684
+ {"current_steps": 1684, "total_steps": 2148, "loss": 0.2131, "lr": 1.3611702697495088e-06, "epoch": 2.351546152057661, "percentage": 78.4, "elapsed_time": "3:55:20", "remaining_time": "1:04:50"}
1685
+ {"current_steps": 1685, "total_steps": 2148, "loss": 0.2329, "lr": 1.3556019155640416e-06, "epoch": 2.3529411764705883, "percentage": 78.45, "elapsed_time": "3:55:29", "remaining_time": "1:04:42"}
1686
+ {"current_steps": 1686, "total_steps": 2148, "loss": 0.2395, "lr": 1.350043187730868e-06, "epoch": 2.3543362008835156, "percentage": 78.49, "elapsed_time": "3:55:37", "remaining_time": "1:04:33"}
1687
+ {"current_steps": 1687, "total_steps": 2148, "loss": 0.2343, "lr": 1.34449410093287e-06, "epoch": 2.355731225296443, "percentage": 78.54, "elapsed_time": "3:55:44", "remaining_time": "1:04:25"}
1688
+ {"current_steps": 1688, "total_steps": 2148, "loss": 0.2171, "lr": 1.3389546698274686e-06, "epoch": 2.3571262497093697, "percentage": 78.58, "elapsed_time": "3:55:52", "remaining_time": "1:04:16"}
1689
+ {"current_steps": 1689, "total_steps": 2148, "loss": 0.2495, "lr": 1.333424909046574e-06, "epoch": 2.358521274122297, "percentage": 78.63, "elapsed_time": "3:56:00", "remaining_time": "1:04:08"}
1690
+ {"current_steps": 1690, "total_steps": 2148, "loss": 0.2586, "lr": 1.327904833196556e-06, "epoch": 2.359916298535224, "percentage": 78.68, "elapsed_time": "3:56:07", "remaining_time": "1:03:59"}
1691
+ {"current_steps": 1691, "total_steps": 2148, "loss": 0.215, "lr": 1.3223944568582047e-06, "epoch": 2.3613113229481515, "percentage": 78.72, "elapsed_time": "3:56:14", "remaining_time": "1:03:50"}
1692
+ {"current_steps": 1692, "total_steps": 2148, "loss": 0.2276, "lr": 1.3168937945866861e-06, "epoch": 2.3627063473610788, "percentage": 78.77, "elapsed_time": "3:56:23", "remaining_time": "1:03:42"}
1693
+ {"current_steps": 1693, "total_steps": 2148, "loss": 0.241, "lr": 1.311402860911507e-06, "epoch": 2.364101371774006, "percentage": 78.82, "elapsed_time": "3:56:31", "remaining_time": "1:03:34"}
1694
+ {"current_steps": 1694, "total_steps": 2148, "loss": 0.2167, "lr": 1.3059216703364814e-06, "epoch": 2.3654963961869333, "percentage": 78.86, "elapsed_time": "3:56:39", "remaining_time": "1:03:25"}
1695
+ {"current_steps": 1695, "total_steps": 2148, "loss": 0.2358, "lr": 1.3004502373396821e-06, "epoch": 2.3668914205998606, "percentage": 78.91, "elapsed_time": "3:56:46", "remaining_time": "1:03:16"}
1696
+ {"current_steps": 1696, "total_steps": 2148, "loss": 0.2423, "lr": 1.2949885763734127e-06, "epoch": 2.368286445012788, "percentage": 78.96, "elapsed_time": "3:56:53", "remaining_time": "1:03:07"}
1697
+ {"current_steps": 1697, "total_steps": 2148, "loss": 0.2244, "lr": 1.2895367018641658e-06, "epoch": 2.369681469425715, "percentage": 79.0, "elapsed_time": "3:56:59", "remaining_time": "1:02:59"}
1698
+ {"current_steps": 1698, "total_steps": 2148, "loss": 0.2582, "lr": 1.284094628212576e-06, "epoch": 2.3710764938386424, "percentage": 79.05, "elapsed_time": "3:57:07", "remaining_time": "1:02:50"}
1699
+ {"current_steps": 1699, "total_steps": 2148, "loss": 0.2202, "lr": 1.278662369793398e-06, "epoch": 2.372471518251569, "percentage": 79.1, "elapsed_time": "3:57:13", "remaining_time": "1:02:41"}
1700
+ {"current_steps": 1700, "total_steps": 2148, "loss": 0.2572, "lr": 1.273239940955459e-06, "epoch": 2.3738665426644965, "percentage": 79.14, "elapsed_time": "3:57:20", "remaining_time": "1:02:32"}
1701
+ {"current_steps": 1701, "total_steps": 2148, "loss": 0.2617, "lr": 1.267827356021618e-06, "epoch": 2.3752615670774238, "percentage": 79.19, "elapsed_time": "3:57:31", "remaining_time": "1:02:25"}
1702
+ {"current_steps": 1702, "total_steps": 2148, "loss": 0.2349, "lr": 1.2624246292887377e-06, "epoch": 2.376656591490351, "percentage": 79.24, "elapsed_time": "3:57:40", "remaining_time": "1:02:16"}
1703
+ {"current_steps": 1703, "total_steps": 2148, "loss": 0.258, "lr": 1.2570317750276374e-06, "epoch": 2.3780516159032783, "percentage": 79.28, "elapsed_time": "3:57:47", "remaining_time": "1:02:08"}
1704
+ {"current_steps": 1704, "total_steps": 2148, "loss": 0.2477, "lr": 1.2516488074830586e-06, "epoch": 2.3794466403162056, "percentage": 79.33, "elapsed_time": "3:57:53", "remaining_time": "1:01:59"}
1705
+ {"current_steps": 1705, "total_steps": 2148, "loss": 0.2331, "lr": 1.246275740873631e-06, "epoch": 2.380841664729133, "percentage": 79.38, "elapsed_time": "3:58:00", "remaining_time": "1:01:50"}
1706
+ {"current_steps": 1706, "total_steps": 2148, "loss": 0.2542, "lr": 1.2409125893918329e-06, "epoch": 2.38223668914206, "percentage": 79.42, "elapsed_time": "3:58:09", "remaining_time": "1:01:42"}
1707
+ {"current_steps": 1707, "total_steps": 2148, "loss": 0.202, "lr": 1.2355593672039462e-06, "epoch": 2.3836317135549874, "percentage": 79.47, "elapsed_time": "3:58:20", "remaining_time": "1:01:34"}
1708
+ {"current_steps": 1708, "total_steps": 2148, "loss": 0.2609, "lr": 1.2302160884500337e-06, "epoch": 2.385026737967914, "percentage": 79.52, "elapsed_time": "3:58:26", "remaining_time": "1:01:25"}
1709
+ {"current_steps": 1709, "total_steps": 2148, "loss": 0.2035, "lr": 1.2248827672438868e-06, "epoch": 2.3864217623808415, "percentage": 79.56, "elapsed_time": "3:58:35", "remaining_time": "1:01:17"}
1710
+ {"current_steps": 1710, "total_steps": 2148, "loss": 0.2388, "lr": 1.2195594176729963e-06, "epoch": 2.3878167867937687, "percentage": 79.61, "elapsed_time": "3:58:45", "remaining_time": "1:01:09"}
1711
+ {"current_steps": 1711, "total_steps": 2148, "loss": 0.2303, "lr": 1.2142460537985168e-06, "epoch": 2.389211811206696, "percentage": 79.66, "elapsed_time": "3:58:52", "remaining_time": "1:01:00"}
1712
+ {"current_steps": 1712, "total_steps": 2148, "loss": 0.2269, "lr": 1.2089426896552265e-06, "epoch": 2.3906068356196233, "percentage": 79.7, "elapsed_time": "3:58:59", "remaining_time": "1:00:51"}
1713
+ {"current_steps": 1713, "total_steps": 2148, "loss": 0.2637, "lr": 1.2036493392514847e-06, "epoch": 2.3920018600325506, "percentage": 79.75, "elapsed_time": "3:59:06", "remaining_time": "1:00:43"}
1714
+ {"current_steps": 1714, "total_steps": 2148, "loss": 0.2096, "lr": 1.1983660165692078e-06, "epoch": 2.393396884445478, "percentage": 79.8, "elapsed_time": "3:59:13", "remaining_time": "1:00:34"}
1715
+ {"current_steps": 1715, "total_steps": 2148, "loss": 0.2436, "lr": 1.1930927355638189e-06, "epoch": 2.394791908858405, "percentage": 79.84, "elapsed_time": "3:59:22", "remaining_time": "1:00:26"}
1716
+ {"current_steps": 1716, "total_steps": 2148, "loss": 0.2319, "lr": 1.1878295101642185e-06, "epoch": 2.3961869332713324, "percentage": 79.89, "elapsed_time": "3:59:31", "remaining_time": "1:00:17"}
1717
+ {"current_steps": 1717, "total_steps": 2148, "loss": 0.2276, "lr": 1.182576354272748e-06, "epoch": 2.3975819576842596, "percentage": 79.93, "elapsed_time": "3:59:38", "remaining_time": "1:00:09"}
1718
+ {"current_steps": 1718, "total_steps": 2148, "loss": 0.2295, "lr": 1.1773332817651512e-06, "epoch": 2.398976982097187, "percentage": 79.98, "elapsed_time": "3:59:48", "remaining_time": "1:00:01"}
1719
+ {"current_steps": 1719, "total_steps": 2148, "loss": 0.2133, "lr": 1.1721003064905329e-06, "epoch": 2.400372006510114, "percentage": 80.03, "elapsed_time": "3:59:55", "remaining_time": "0:59:52"}
1720
+ {"current_steps": 1720, "total_steps": 2148, "loss": 0.2396, "lr": 1.1668774422713336e-06, "epoch": 2.401767030923041, "percentage": 80.07, "elapsed_time": "4:00:02", "remaining_time": "0:59:43"}
1721
+ {"current_steps": 1721, "total_steps": 2148, "loss": 0.2383, "lr": 1.1616647029032818e-06, "epoch": 2.4031620553359683, "percentage": 80.12, "elapsed_time": "4:00:16", "remaining_time": "0:59:36"}
1722
+ {"current_steps": 1722, "total_steps": 2148, "loss": 0.2294, "lr": 1.1564621021553617e-06, "epoch": 2.4045570797488955, "percentage": 80.17, "elapsed_time": "4:00:26", "remaining_time": "0:59:28"}
1723
+ {"current_steps": 1723, "total_steps": 2148, "loss": 0.2628, "lr": 1.1512696537697804e-06, "epoch": 2.405952104161823, "percentage": 80.21, "elapsed_time": "4:00:32", "remaining_time": "0:59:19"}
1724
+ {"current_steps": 1724, "total_steps": 2148, "loss": 0.2684, "lr": 1.1460873714619275e-06, "epoch": 2.40734712857475, "percentage": 80.26, "elapsed_time": "4:00:39", "remaining_time": "0:59:11"}
1725
+ {"current_steps": 1725, "total_steps": 2148, "loss": 0.2423, "lr": 1.140915268920339e-06, "epoch": 2.4087421529876774, "percentage": 80.31, "elapsed_time": "4:00:46", "remaining_time": "0:59:02"}
1726
+ {"current_steps": 1726, "total_steps": 2148, "loss": 0.2245, "lr": 1.13575335980666e-06, "epoch": 2.4101371774006046, "percentage": 80.35, "elapsed_time": "4:00:52", "remaining_time": "0:58:53"}
1727
+ {"current_steps": 1727, "total_steps": 2148, "loss": 0.2221, "lr": 1.130601657755616e-06, "epoch": 2.411532201813532, "percentage": 80.4, "elapsed_time": "4:01:02", "remaining_time": "0:58:45"}
1728
+ {"current_steps": 1728, "total_steps": 2148, "loss": 0.227, "lr": 1.125460176374965e-06, "epoch": 2.4129272262264587, "percentage": 80.45, "elapsed_time": "4:01:08", "remaining_time": "0:58:36"}
1729
+ {"current_steps": 1729, "total_steps": 2148, "loss": 0.2523, "lr": 1.1203289292454728e-06, "epoch": 2.414322250639386, "percentage": 80.49, "elapsed_time": "4:01:16", "remaining_time": "0:58:28"}
1730
+ {"current_steps": 1730, "total_steps": 2148, "loss": 0.2486, "lr": 1.1152079299208724e-06, "epoch": 2.4157172750523133, "percentage": 80.54, "elapsed_time": "4:01:27", "remaining_time": "0:58:20"}
1731
+ {"current_steps": 1731, "total_steps": 2148, "loss": 0.2286, "lr": 1.1100971919278247e-06, "epoch": 2.4171122994652405, "percentage": 80.59, "elapsed_time": "4:01:34", "remaining_time": "0:58:11"}
1732
+ {"current_steps": 1732, "total_steps": 2148, "loss": 0.2471, "lr": 1.104996728765887e-06, "epoch": 2.418507323878168, "percentage": 80.63, "elapsed_time": "4:01:42", "remaining_time": "0:58:03"}
1733
+ {"current_steps": 1733, "total_steps": 2148, "loss": 0.2395, "lr": 1.0999065539074793e-06, "epoch": 2.419902348291095, "percentage": 80.68, "elapsed_time": "4:01:51", "remaining_time": "0:57:55"}
1734
+ {"current_steps": 1734, "total_steps": 2148, "loss": 0.2323, "lr": 1.094826680797843e-06, "epoch": 2.4212973727040223, "percentage": 80.73, "elapsed_time": "4:01:59", "remaining_time": "0:57:46"}
1735
+ {"current_steps": 1735, "total_steps": 2148, "loss": 0.2472, "lr": 1.0897571228550097e-06, "epoch": 2.4226923971169496, "percentage": 80.77, "elapsed_time": "4:02:07", "remaining_time": "0:57:38"}
1736
+ {"current_steps": 1736, "total_steps": 2148, "loss": 0.2422, "lr": 1.0846978934697666e-06, "epoch": 2.424087421529877, "percentage": 80.82, "elapsed_time": "4:02:15", "remaining_time": "0:57:29"}
1737
+ {"current_steps": 1737, "total_steps": 2148, "loss": 0.2313, "lr": 1.0796490060056142e-06, "epoch": 2.425482445942804, "percentage": 80.87, "elapsed_time": "4:02:22", "remaining_time": "0:57:21"}
1738
+ {"current_steps": 1738, "total_steps": 2148, "loss": 0.2287, "lr": 1.074610473798738e-06, "epoch": 2.4268774703557314, "percentage": 80.91, "elapsed_time": "4:02:30", "remaining_time": "0:57:12"}
1739
+ {"current_steps": 1739, "total_steps": 2148, "loss": 0.2227, "lr": 1.0695823101579728e-06, "epoch": 2.4282724947686587, "percentage": 80.96, "elapsed_time": "4:02:36", "remaining_time": "0:57:03"}
1740
+ {"current_steps": 1740, "total_steps": 2148, "loss": 0.2395, "lr": 1.0645645283647616e-06, "epoch": 2.4296675191815855, "percentage": 81.01, "elapsed_time": "4:02:43", "remaining_time": "0:56:54"}
1741
+ {"current_steps": 1741, "total_steps": 2148, "loss": 0.228, "lr": 1.0595571416731293e-06, "epoch": 2.431062543594513, "percentage": 81.05, "elapsed_time": "4:02:52", "remaining_time": "0:56:46"}
1742
+ {"current_steps": 1742, "total_steps": 2148, "loss": 0.2213, "lr": 1.0545601633096414e-06, "epoch": 2.43245756800744, "percentage": 81.1, "elapsed_time": "4:02:59", "remaining_time": "0:56:37"}
1743
+ {"current_steps": 1743, "total_steps": 2148, "loss": 0.245, "lr": 1.049573606473369e-06, "epoch": 2.4338525924203673, "percentage": 81.15, "elapsed_time": "4:03:06", "remaining_time": "0:56:29"}
1744
+ {"current_steps": 1744, "total_steps": 2148, "loss": 0.2079, "lr": 1.0445974843358563e-06, "epoch": 2.4352476168332946, "percentage": 81.19, "elapsed_time": "4:03:13", "remaining_time": "0:56:20"}
1745
+ {"current_steps": 1745, "total_steps": 2148, "loss": 0.2241, "lr": 1.0396318100410868e-06, "epoch": 2.436642641246222, "percentage": 81.24, "elapsed_time": "4:03:19", "remaining_time": "0:56:11"}
1746
+ {"current_steps": 1746, "total_steps": 2148, "loss": 0.2574, "lr": 1.0346765967054472e-06, "epoch": 2.438037665659149, "percentage": 81.28, "elapsed_time": "4:03:25", "remaining_time": "0:56:02"}
1747
+ {"current_steps": 1747, "total_steps": 2148, "loss": 0.2589, "lr": 1.029731857417689e-06, "epoch": 2.4394326900720764, "percentage": 81.33, "elapsed_time": "4:03:31", "remaining_time": "0:55:53"}
1748
+ {"current_steps": 1748, "total_steps": 2148, "loss": 0.2377, "lr": 1.0247976052389018e-06, "epoch": 2.4408277144850032, "percentage": 81.38, "elapsed_time": "4:03:38", "remaining_time": "0:55:45"}
1749
+ {"current_steps": 1749, "total_steps": 2148, "loss": 0.2201, "lr": 1.0198738532024715e-06, "epoch": 2.4422227388979305, "percentage": 81.42, "elapsed_time": "4:03:45", "remaining_time": "0:55:36"}
1750
+ {"current_steps": 1750, "total_steps": 2148, "loss": 0.2464, "lr": 1.0149606143140484e-06, "epoch": 2.443617763310858, "percentage": 81.47, "elapsed_time": "4:03:52", "remaining_time": "0:55:27"}
1751
+ {"current_steps": 1751, "total_steps": 2148, "loss": 0.2387, "lr": 1.0100579015515156e-06, "epoch": 2.445012787723785, "percentage": 81.52, "elapsed_time": "4:04:00", "remaining_time": "0:55:19"}
1752
+ {"current_steps": 1752, "total_steps": 2148, "loss": 0.2382, "lr": 1.005165727864953e-06, "epoch": 2.4464078121367123, "percentage": 81.56, "elapsed_time": "4:04:07", "remaining_time": "0:55:10"}
1753
+ {"current_steps": 1753, "total_steps": 2148, "loss": 0.2303, "lr": 1.0002841061765989e-06, "epoch": 2.4478028365496396, "percentage": 81.61, "elapsed_time": "4:04:14", "remaining_time": "0:55:02"}
1754
+ {"current_steps": 1754, "total_steps": 2148, "loss": 0.2343, "lr": 9.954130493808201e-07, "epoch": 2.449197860962567, "percentage": 81.66, "elapsed_time": "4:04:21", "remaining_time": "0:54:53"}
1755
+ {"current_steps": 1755, "total_steps": 2148, "loss": 0.2324, "lr": 9.905525703440815e-07, "epoch": 2.450592885375494, "percentage": 81.7, "elapsed_time": "4:04:28", "remaining_time": "0:54:44"}
1756
+ {"current_steps": 1756, "total_steps": 2148, "loss": 0.2128, "lr": 9.85702681904902e-07, "epoch": 2.4519879097884214, "percentage": 81.75, "elapsed_time": "4:04:39", "remaining_time": "0:54:37"}
1757
+ {"current_steps": 1757, "total_steps": 2148, "loss": 0.2389, "lr": 9.808633968738297e-07, "epoch": 2.4533829342013487, "percentage": 81.8, "elapsed_time": "4:04:46", "remaining_time": "0:54:28"}
1758
+ {"current_steps": 1758, "total_steps": 2148, "loss": 0.2539, "lr": 9.760347280334064e-07, "epoch": 2.454777958614276, "percentage": 81.84, "elapsed_time": "4:04:53", "remaining_time": "0:54:19"}
1759
+ {"current_steps": 1759, "total_steps": 2148, "loss": 0.2416, "lr": 9.712166881381279e-07, "epoch": 2.456172983027203, "percentage": 81.89, "elapsed_time": "4:05:00", "remaining_time": "0:54:10"}
1760
+ {"current_steps": 1760, "total_steps": 2148, "loss": 0.2459, "lr": 9.664092899144156e-07, "epoch": 2.45756800744013, "percentage": 81.94, "elapsed_time": "4:05:07", "remaining_time": "0:54:02"}
1761
+ {"current_steps": 1761, "total_steps": 2148, "loss": 0.219, "lr": 9.616125460605857e-07, "epoch": 2.4589630318530573, "percentage": 81.98, "elapsed_time": "4:05:15", "remaining_time": "0:53:53"}
1762
+ {"current_steps": 1762, "total_steps": 2148, "loss": 0.2164, "lr": 9.56826469246806e-07, "epoch": 2.4603580562659846, "percentage": 82.03, "elapsed_time": "4:05:24", "remaining_time": "0:53:45"}
1763
+ {"current_steps": 1763, "total_steps": 2148, "loss": 0.2205, "lr": 9.520510721150722e-07, "epoch": 2.461753080678912, "percentage": 82.08, "elapsed_time": "4:05:31", "remaining_time": "0:53:37"}
1764
+ {"current_steps": 1764, "total_steps": 2148, "loss": 0.2797, "lr": 9.472863672791721e-07, "epoch": 2.463148105091839, "percentage": 82.12, "elapsed_time": "4:05:39", "remaining_time": "0:53:28"}
1765
+ {"current_steps": 1765, "total_steps": 2148, "loss": 0.2311, "lr": 9.425323673246461e-07, "epoch": 2.4645431295047664, "percentage": 82.17, "elapsed_time": "4:05:48", "remaining_time": "0:53:20"}
1766
+ {"current_steps": 1766, "total_steps": 2148, "loss": 0.2422, "lr": 9.377890848087595e-07, "epoch": 2.4659381539176937, "percentage": 82.22, "elapsed_time": "4:05:54", "remaining_time": "0:53:11"}
1767
+ {"current_steps": 1767, "total_steps": 2148, "loss": 0.2557, "lr": 9.330565322604729e-07, "epoch": 2.467333178330621, "percentage": 82.26, "elapsed_time": "4:06:07", "remaining_time": "0:53:04"}
1768
+ {"current_steps": 1768, "total_steps": 2148, "loss": 0.2365, "lr": 9.283347221803985e-07, "epoch": 2.468728202743548, "percentage": 82.31, "elapsed_time": "4:06:14", "remaining_time": "0:52:55"}
1769
+ {"current_steps": 1769, "total_steps": 2148, "loss": 0.2611, "lr": 9.236236670407772e-07, "epoch": 2.470123227156475, "percentage": 82.36, "elapsed_time": "4:06:21", "remaining_time": "0:52:46"}
1770
+ {"current_steps": 1770, "total_steps": 2148, "loss": 0.2471, "lr": 9.189233792854424e-07, "epoch": 2.4715182515694023, "percentage": 82.4, "elapsed_time": "4:06:27", "remaining_time": "0:52:37"}
1771
+ {"current_steps": 1771, "total_steps": 2148, "loss": 0.2462, "lr": 9.142338713297838e-07, "epoch": 2.4729132759823296, "percentage": 82.45, "elapsed_time": "4:06:35", "remaining_time": "0:52:29"}
1772
+ {"current_steps": 1772, "total_steps": 2148, "loss": 0.2399, "lr": 9.095551555607169e-07, "epoch": 2.474308300395257, "percentage": 82.5, "elapsed_time": "4:06:43", "remaining_time": "0:52:21"}
1773
+ {"current_steps": 1773, "total_steps": 2148, "loss": 0.2505, "lr": 9.048872443366529e-07, "epoch": 2.475703324808184, "percentage": 82.54, "elapsed_time": "4:06:51", "remaining_time": "0:52:12"}
1774
+ {"current_steps": 1774, "total_steps": 2148, "loss": 0.2365, "lr": 9.002301499874622e-07, "epoch": 2.4770983492211114, "percentage": 82.59, "elapsed_time": "4:06:59", "remaining_time": "0:52:04"}
1775
+ {"current_steps": 1775, "total_steps": 2148, "loss": 0.2229, "lr": 8.955838848144449e-07, "epoch": 2.4784933736340387, "percentage": 82.64, "elapsed_time": "4:07:07", "remaining_time": "0:51:55"}
1776
+ {"current_steps": 1776, "total_steps": 2148, "loss": 0.2521, "lr": 8.909484610902958e-07, "epoch": 2.479888398046966, "percentage": 82.68, "elapsed_time": "4:07:17", "remaining_time": "0:51:47"}
1777
+ {"current_steps": 1777, "total_steps": 2148, "loss": 0.2096, "lr": 8.863238910590704e-07, "epoch": 2.481283422459893, "percentage": 82.73, "elapsed_time": "4:07:24", "remaining_time": "0:51:39"}
1778
+ {"current_steps": 1778, "total_steps": 2148, "loss": 0.2482, "lr": 8.817101869361599e-07, "epoch": 2.4826784468728205, "percentage": 82.77, "elapsed_time": "4:07:31", "remaining_time": "0:51:30"}
1779
+ {"current_steps": 1779, "total_steps": 2148, "loss": 0.2652, "lr": 8.77107360908253e-07, "epoch": 2.4840734712857477, "percentage": 82.82, "elapsed_time": "4:07:38", "remaining_time": "0:51:21"}
1780
+ {"current_steps": 1780, "total_steps": 2148, "loss": 0.2339, "lr": 8.725154251333012e-07, "epoch": 2.4854684956986746, "percentage": 82.87, "elapsed_time": "4:07:44", "remaining_time": "0:51:13"}
1781
+ {"current_steps": 1781, "total_steps": 2148, "loss": 0.2962, "lr": 8.679343917404959e-07, "epoch": 2.486863520111602, "percentage": 82.91, "elapsed_time": "4:07:57", "remaining_time": "0:51:05"}
1782
+ {"current_steps": 1782, "total_steps": 2148, "loss": 0.2409, "lr": 8.633642728302266e-07, "epoch": 2.488258544524529, "percentage": 82.96, "elapsed_time": "4:08:03", "remaining_time": "0:50:56"}
1783
+ {"current_steps": 1783, "total_steps": 2148, "loss": 0.226, "lr": 8.588050804740527e-07, "epoch": 2.4896535689374564, "percentage": 83.01, "elapsed_time": "4:08:12", "remaining_time": "0:50:48"}
1784
+ {"current_steps": 1784, "total_steps": 2148, "loss": 0.2163, "lr": 8.542568267146761e-07, "epoch": 2.4910485933503836, "percentage": 83.05, "elapsed_time": "4:08:21", "remaining_time": "0:50:40"}
1785
+ {"current_steps": 1785, "total_steps": 2148, "loss": 0.2184, "lr": 8.49719523565904e-07, "epoch": 2.492443617763311, "percentage": 83.1, "elapsed_time": "4:08:28", "remaining_time": "0:50:31"}
1786
+ {"current_steps": 1786, "total_steps": 2148, "loss": 0.2385, "lr": 8.451931830126148e-07, "epoch": 2.493838642176238, "percentage": 83.15, "elapsed_time": "4:08:36", "remaining_time": "0:50:23"}
1787
+ {"current_steps": 1787, "total_steps": 2148, "loss": 0.2222, "lr": 8.40677817010736e-07, "epoch": 2.4952336665891655, "percentage": 83.19, "elapsed_time": "4:08:48", "remaining_time": "0:50:15"}
1788
+ {"current_steps": 1788, "total_steps": 2148, "loss": 0.2424, "lr": 8.361734374872032e-07, "epoch": 2.4966286910020927, "percentage": 83.24, "elapsed_time": "4:08:55", "remaining_time": "0:50:07"}
1789
+ {"current_steps": 1789, "total_steps": 2148, "loss": 0.2252, "lr": 8.316800563399307e-07, "epoch": 2.4980237154150196, "percentage": 83.29, "elapsed_time": "4:09:02", "remaining_time": "0:49:58"}
1790
+ {"current_steps": 1790, "total_steps": 2148, "loss": 0.2155, "lr": 8.271976854377861e-07, "epoch": 2.499418739827947, "percentage": 83.33, "elapsed_time": "4:09:08", "remaining_time": "0:49:49"}
1791
+ {"current_steps": 1791, "total_steps": 2148, "loss": 0.264, "lr": 8.227263366205523e-07, "epoch": 2.500813764240874, "percentage": 83.38, "elapsed_time": "4:09:17", "remaining_time": "0:49:41"}
1792
+ {"current_steps": 1792, "total_steps": 2148, "loss": 0.3259, "lr": 8.182660216988964e-07, "epoch": 2.5022087886538014, "percentage": 83.43, "elapsed_time": "4:09:24", "remaining_time": "0:49:32"}
1793
+ {"current_steps": 1793, "total_steps": 2148, "loss": 0.2514, "lr": 8.138167524543445e-07, "epoch": 2.5036038130667286, "percentage": 83.47, "elapsed_time": "4:09:30", "remaining_time": "0:49:24"}
1794
+ {"current_steps": 1794, "total_steps": 2148, "loss": 0.2515, "lr": 8.09378540639243e-07, "epoch": 2.504998837479656, "percentage": 83.52, "elapsed_time": "4:09:41", "remaining_time": "0:49:16"}
1795
+ {"current_steps": 1795, "total_steps": 2148, "loss": 0.2479, "lr": 8.049513979767304e-07, "epoch": 2.506393861892583, "percentage": 83.57, "elapsed_time": "4:09:48", "remaining_time": "0:49:07"}
1796
+ {"current_steps": 1796, "total_steps": 2148, "loss": 0.2003, "lr": 8.00535336160711e-07, "epoch": 2.5077888863055104, "percentage": 83.61, "elapsed_time": "4:09:54", "remaining_time": "0:48:58"}
1797
+ {"current_steps": 1797, "total_steps": 2148, "loss": 0.2429, "lr": 7.96130366855819e-07, "epoch": 2.5091839107184377, "percentage": 83.66, "elapsed_time": "4:10:00", "remaining_time": "0:48:50"}
1798
+ {"current_steps": 1798, "total_steps": 2148, "loss": 0.2206, "lr": 7.917365016973866e-07, "epoch": 2.510578935131365, "percentage": 83.71, "elapsed_time": "4:10:07", "remaining_time": "0:48:41"}
1799
+ {"current_steps": 1799, "total_steps": 2148, "loss": 0.2506, "lr": 7.873537522914155e-07, "epoch": 2.5119739595442923, "percentage": 83.75, "elapsed_time": "4:10:16", "remaining_time": "0:48:33"}
1800
+ {"current_steps": 1800, "total_steps": 2148, "loss": 0.2345, "lr": 7.829821302145485e-07, "epoch": 2.5133689839572195, "percentage": 83.8, "elapsed_time": "4:10:23", "remaining_time": "0:48:24"}
1801
+ {"current_steps": 1801, "total_steps": 2148, "loss": 0.2365, "lr": 7.786216470140334e-07, "epoch": 2.5147640083701464, "percentage": 83.85, "elapsed_time": "4:10:30", "remaining_time": "0:48:15"}
1802
+ {"current_steps": 1802, "total_steps": 2148, "loss": 0.233, "lr": 7.742723142076991e-07, "epoch": 2.5161590327830736, "percentage": 83.89, "elapsed_time": "4:10:36", "remaining_time": "0:48:07"}
1803
+ {"current_steps": 1803, "total_steps": 2148, "loss": 0.2465, "lr": 7.699341432839203e-07, "epoch": 2.517554057196001, "percentage": 83.94, "elapsed_time": "4:10:43", "remaining_time": "0:47:58"}
1804
+ {"current_steps": 1804, "total_steps": 2148, "loss": 0.2094, "lr": 7.656071457015879e-07, "epoch": 2.518949081608928, "percentage": 83.99, "elapsed_time": "4:10:49", "remaining_time": "0:47:49"}
1805
+ {"current_steps": 1805, "total_steps": 2148, "loss": 0.2308, "lr": 7.612913328900784e-07, "epoch": 2.5203441060218554, "percentage": 84.03, "elapsed_time": "4:11:00", "remaining_time": "0:47:41"}
1806
+ {"current_steps": 1806, "total_steps": 2148, "loss": 0.2009, "lr": 7.569867162492283e-07, "epoch": 2.5217391304347827, "percentage": 84.08, "elapsed_time": "4:11:08", "remaining_time": "0:47:33"}
1807
+ {"current_steps": 1807, "total_steps": 2148, "loss": 0.2628, "lr": 7.526933071492959e-07, "epoch": 2.52313415484771, "percentage": 84.12, "elapsed_time": "4:11:20", "remaining_time": "0:47:25"}
1808
+ {"current_steps": 1808, "total_steps": 2148, "loss": 0.2267, "lr": 7.484111169309399e-07, "epoch": 2.524529179260637, "percentage": 84.17, "elapsed_time": "4:11:28", "remaining_time": "0:47:17"}
1809
+ {"current_steps": 1809, "total_steps": 2148, "loss": 0.2307, "lr": 7.441401569051848e-07, "epoch": 2.525924203673564, "percentage": 84.22, "elapsed_time": "4:11:40", "remaining_time": "0:47:09"}
1810
+ {"current_steps": 1810, "total_steps": 2148, "loss": 0.2172, "lr": 7.398804383533886e-07, "epoch": 2.5273192280864913, "percentage": 84.26, "elapsed_time": "4:11:46", "remaining_time": "0:47:01"}
1811
+ {"current_steps": 1811, "total_steps": 2148, "loss": 0.2354, "lr": 7.356319725272165e-07, "epoch": 2.5287142524994186, "percentage": 84.31, "elapsed_time": "4:11:53", "remaining_time": "0:46:52"}
1812
+ {"current_steps": 1812, "total_steps": 2148, "loss": 0.2439, "lr": 7.313947706486136e-07, "epoch": 2.530109276912346, "percentage": 84.36, "elapsed_time": "4:12:03", "remaining_time": "0:46:44"}
1813
+ {"current_steps": 1813, "total_steps": 2148, "loss": 0.2611, "lr": 7.271688439097713e-07, "epoch": 2.531504301325273, "percentage": 84.4, "elapsed_time": "4:12:13", "remaining_time": "0:46:36"}
1814
+ {"current_steps": 1814, "total_steps": 2148, "loss": 0.1908, "lr": 7.229542034730952e-07, "epoch": 2.5328993257382004, "percentage": 84.45, "elapsed_time": "4:12:19", "remaining_time": "0:46:27"}
1815
+ {"current_steps": 1815, "total_steps": 2148, "loss": 0.239, "lr": 7.187508604711851e-07, "epoch": 2.5342943501511277, "percentage": 84.5, "elapsed_time": "4:12:28", "remaining_time": "0:46:19"}
1816
+ {"current_steps": 1816, "total_steps": 2148, "loss": 0.2547, "lr": 7.145588260067943e-07, "epoch": 2.535689374564055, "percentage": 84.54, "elapsed_time": "4:12:37", "remaining_time": "0:46:11"}
1817
+ {"current_steps": 1817, "total_steps": 2148, "loss": 0.2386, "lr": 7.103781111528074e-07, "epoch": 2.5370843989769822, "percentage": 84.59, "elapsed_time": "4:12:47", "remaining_time": "0:46:03"}
1818
+ {"current_steps": 1818, "total_steps": 2148, "loss": 0.2083, "lr": 7.062087269522105e-07, "epoch": 2.5384794233899095, "percentage": 84.64, "elapsed_time": "4:12:54", "remaining_time": "0:45:54"}
1819
+ {"current_steps": 1819, "total_steps": 2148, "loss": 0.24, "lr": 7.020506844180608e-07, "epoch": 2.5398744478028368, "percentage": 84.68, "elapsed_time": "4:13:03", "remaining_time": "0:45:46"}
1820
+ {"current_steps": 1820, "total_steps": 2148, "loss": 0.2422, "lr": 6.979039945334543e-07, "epoch": 2.541269472215764, "percentage": 84.73, "elapsed_time": "4:13:09", "remaining_time": "0:45:37"}
1821
+ {"current_steps": 1821, "total_steps": 2148, "loss": 0.2353, "lr": 6.937686682515044e-07, "epoch": 2.542664496628691, "percentage": 84.78, "elapsed_time": "4:13:16", "remaining_time": "0:45:28"}
1822
+ {"current_steps": 1822, "total_steps": 2148, "loss": 0.2535, "lr": 6.896447164953057e-07, "epoch": 2.544059521041618, "percentage": 84.82, "elapsed_time": "4:13:23", "remaining_time": "0:45:20"}
1823
+ {"current_steps": 1823, "total_steps": 2148, "loss": 0.2345, "lr": 6.855321501579077e-07, "epoch": 2.5454545454545454, "percentage": 84.87, "elapsed_time": "4:13:33", "remaining_time": "0:45:12"}
1824
+ {"current_steps": 1824, "total_steps": 2148, "loss": 0.24, "lr": 6.814309801022873e-07, "epoch": 2.5468495698674727, "percentage": 84.92, "elapsed_time": "4:13:43", "remaining_time": "0:45:04"}
1825
+ {"current_steps": 1825, "total_steps": 2148, "loss": 0.2644, "lr": 6.77341217161322e-07, "epoch": 2.5482445942804, "percentage": 84.96, "elapsed_time": "4:13:50", "remaining_time": "0:44:55"}
1826
+ {"current_steps": 1826, "total_steps": 2148, "loss": 0.2187, "lr": 6.732628721377533e-07, "epoch": 2.5496396186933272, "percentage": 85.01, "elapsed_time": "4:13:56", "remaining_time": "0:44:46"}
1827
+ {"current_steps": 1827, "total_steps": 2148, "loss": 0.2894, "lr": 6.69195955804165e-07, "epoch": 2.5510346431062545, "percentage": 85.06, "elapsed_time": "4:14:03", "remaining_time": "0:44:38"}
1828
+ {"current_steps": 1828, "total_steps": 2148, "loss": 0.2351, "lr": 6.651404789029553e-07, "epoch": 2.5524296675191813, "percentage": 85.1, "elapsed_time": "4:14:13", "remaining_time": "0:44:30"}
1829
+ {"current_steps": 1829, "total_steps": 2148, "loss": 0.2367, "lr": 6.610964521463032e-07, "epoch": 2.5538246919321086, "percentage": 85.15, "elapsed_time": "4:14:23", "remaining_time": "0:44:22"}
1830
+ {"current_steps": 1830, "total_steps": 2148, "loss": 0.2136, "lr": 6.570638862161449e-07, "epoch": 2.555219716345036, "percentage": 85.2, "elapsed_time": "4:14:31", "remaining_time": "0:44:13"}
1831
+ {"current_steps": 1831, "total_steps": 2148, "loss": 0.2161, "lr": 6.530427917641447e-07, "epoch": 2.556614740757963, "percentage": 85.24, "elapsed_time": "4:14:39", "remaining_time": "0:44:05"}
1832
+ {"current_steps": 1832, "total_steps": 2148, "loss": 0.2535, "lr": 6.490331794116633e-07, "epoch": 2.5580097651708904, "percentage": 85.29, "elapsed_time": "4:14:46", "remaining_time": "0:43:56"}
1833
+ {"current_steps": 1833, "total_steps": 2148, "loss": 0.2094, "lr": 6.450350597497335e-07, "epoch": 2.5594047895838177, "percentage": 85.34, "elapsed_time": "4:14:53", "remaining_time": "0:43:48"}
1834
+ {"current_steps": 1834, "total_steps": 2148, "loss": 0.2517, "lr": 6.410484433390335e-07, "epoch": 2.560799813996745, "percentage": 85.38, "elapsed_time": "4:15:03", "remaining_time": "0:43:40"}
1835
+ {"current_steps": 1835, "total_steps": 2148, "loss": 0.2051, "lr": 6.370733407098517e-07, "epoch": 2.562194838409672, "percentage": 85.43, "elapsed_time": "4:15:13", "remaining_time": "0:43:32"}
1836
+ {"current_steps": 1836, "total_steps": 2148, "loss": 0.2411, "lr": 6.331097623620697e-07, "epoch": 2.5635898628225995, "percentage": 85.47, "elapsed_time": "4:15:23", "remaining_time": "0:43:24"}
1837
+ {"current_steps": 1837, "total_steps": 2148, "loss": 0.2229, "lr": 6.291577187651255e-07, "epoch": 2.5649848872355268, "percentage": 85.52, "elapsed_time": "4:15:30", "remaining_time": "0:43:15"}
1838
+ {"current_steps": 1838, "total_steps": 2148, "loss": 0.2405, "lr": 6.252172203579892e-07, "epoch": 2.566379911648454, "percentage": 85.57, "elapsed_time": "4:15:36", "remaining_time": "0:43:06"}
1839
+ {"current_steps": 1839, "total_steps": 2148, "loss": 0.2727, "lr": 6.212882775491352e-07, "epoch": 2.5677749360613813, "percentage": 85.61, "elapsed_time": "4:15:46", "remaining_time": "0:42:58"}
1840
+ {"current_steps": 1840, "total_steps": 2148, "loss": 0.2451, "lr": 6.173709007165158e-07, "epoch": 2.5691699604743086, "percentage": 85.66, "elapsed_time": "4:15:53", "remaining_time": "0:42:50"}
1841
+ {"current_steps": 1841, "total_steps": 2148, "loss": 0.2332, "lr": 6.134651002075315e-07, "epoch": 2.5705649848872354, "percentage": 85.71, "elapsed_time": "4:16:01", "remaining_time": "0:42:41"}
1842
+ {"current_steps": 1842, "total_steps": 2148, "loss": 0.2443, "lr": 6.095708863390065e-07, "epoch": 2.5719600093001627, "percentage": 85.75, "elapsed_time": "4:16:10", "remaining_time": "0:42:33"}
1843
+ {"current_steps": 1843, "total_steps": 2148, "loss": 0.2183, "lr": 6.056882693971605e-07, "epoch": 2.57335503371309, "percentage": 85.8, "elapsed_time": "4:16:18", "remaining_time": "0:42:24"}
1844
+ {"current_steps": 1844, "total_steps": 2148, "loss": 0.2642, "lr": 6.018172596375776e-07, "epoch": 2.574750058126017, "percentage": 85.85, "elapsed_time": "4:16:24", "remaining_time": "0:42:16"}
1845
+ {"current_steps": 1845, "total_steps": 2148, "loss": 0.2464, "lr": 5.979578672851843e-07, "epoch": 2.5761450825389445, "percentage": 85.89, "elapsed_time": "4:16:36", "remaining_time": "0:42:08"}
1846
+ {"current_steps": 1846, "total_steps": 2148, "loss": 0.222, "lr": 5.941101025342239e-07, "epoch": 2.5775401069518717, "percentage": 85.94, "elapsed_time": "4:16:45", "remaining_time": "0:42:00"}
1847
+ {"current_steps": 1847, "total_steps": 2148, "loss": 0.2893, "lr": 5.902739755482201e-07, "epoch": 2.578935131364799, "percentage": 85.99, "elapsed_time": "4:16:53", "remaining_time": "0:41:51"}
1848
+ {"current_steps": 1848, "total_steps": 2148, "loss": 0.2155, "lr": 5.864494964599615e-07, "epoch": 2.580330155777726, "percentage": 86.03, "elapsed_time": "4:16:59", "remaining_time": "0:41:43"}
1849
+ {"current_steps": 1849, "total_steps": 2148, "loss": 0.2356, "lr": 5.826366753714707e-07, "epoch": 2.581725180190653, "percentage": 86.08, "elapsed_time": "4:17:09", "remaining_time": "0:41:35"}
1850
+ {"current_steps": 1850, "total_steps": 2148, "loss": 0.2252, "lr": 5.788355223539698e-07, "epoch": 2.5831202046035804, "percentage": 86.13, "elapsed_time": "4:17:18", "remaining_time": "0:41:26"}
1851
+ {"current_steps": 1851, "total_steps": 2148, "loss": 0.221, "lr": 5.750460474478675e-07, "epoch": 2.5845152290165077, "percentage": 86.17, "elapsed_time": "4:17:25", "remaining_time": "0:41:18"}
1852
+ {"current_steps": 1852, "total_steps": 2148, "loss": 0.2277, "lr": 5.712682606627251e-07, "epoch": 2.585910253429435, "percentage": 86.22, "elapsed_time": "4:17:32", "remaining_time": "0:41:09"}
1853
+ {"current_steps": 1853, "total_steps": 2148, "loss": 0.2428, "lr": 5.675021719772262e-07, "epoch": 2.587305277842362, "percentage": 86.27, "elapsed_time": "4:17:43", "remaining_time": "0:41:01"}
1854
+ {"current_steps": 1854, "total_steps": 2148, "loss": 0.2221, "lr": 5.637477913391604e-07, "epoch": 2.5887003022552895, "percentage": 86.31, "elapsed_time": "4:17:49", "remaining_time": "0:40:53"}
1855
+ {"current_steps": 1855, "total_steps": 2148, "loss": 0.258, "lr": 5.600051286653884e-07, "epoch": 2.5900953266682167, "percentage": 86.36, "elapsed_time": "4:17:59", "remaining_time": "0:40:44"}
1856
+ {"current_steps": 1856, "total_steps": 2148, "loss": 0.2299, "lr": 5.562741938418187e-07, "epoch": 2.591490351081144, "percentage": 86.41, "elapsed_time": "4:18:05", "remaining_time": "0:40:36"}
1857
+ {"current_steps": 1857, "total_steps": 2148, "loss": 0.2349, "lr": 5.525549967233829e-07, "epoch": 2.5928853754940713, "percentage": 86.45, "elapsed_time": "4:18:12", "remaining_time": "0:40:27"}
1858
+ {"current_steps": 1858, "total_steps": 2148, "loss": 0.2325, "lr": 5.488475471340099e-07, "epoch": 2.5942803999069985, "percentage": 86.5, "elapsed_time": "4:18:20", "remaining_time": "0:40:19"}
1859
+ {"current_steps": 1859, "total_steps": 2148, "loss": 0.2428, "lr": 5.451518548665946e-07, "epoch": 2.595675424319926, "percentage": 86.55, "elapsed_time": "4:18:27", "remaining_time": "0:40:10"}
1860
+ {"current_steps": 1860, "total_steps": 2148, "loss": 0.2332, "lr": 5.414679296829806e-07, "epoch": 2.597070448732853, "percentage": 86.59, "elapsed_time": "4:18:33", "remaining_time": "0:40:02"}
1861
+ {"current_steps": 1861, "total_steps": 2148, "loss": 0.199, "lr": 5.377957813139262e-07, "epoch": 2.59846547314578, "percentage": 86.64, "elapsed_time": "4:18:41", "remaining_time": "0:39:53"}
1862
+ {"current_steps": 1862, "total_steps": 2148, "loss": 0.3003, "lr": 5.341354194590831e-07, "epoch": 2.599860497558707, "percentage": 86.69, "elapsed_time": "4:18:47", "remaining_time": "0:39:45"}
1863
+ {"current_steps": 1863, "total_steps": 2148, "loss": 0.2218, "lr": 5.304868537869706e-07, "epoch": 2.6012555219716345, "percentage": 86.73, "elapsed_time": "4:18:54", "remaining_time": "0:39:36"}
1864
+ {"current_steps": 1864, "total_steps": 2148, "loss": 0.228, "lr": 5.268500939349514e-07, "epoch": 2.6026505463845617, "percentage": 86.78, "elapsed_time": "4:19:01", "remaining_time": "0:39:27"}
1865
+ {"current_steps": 1865, "total_steps": 2148, "loss": 0.2143, "lr": 5.232251495091989e-07, "epoch": 2.604045570797489, "percentage": 86.82, "elapsed_time": "4:19:08", "remaining_time": "0:39:19"}
1866
+ {"current_steps": 1866, "total_steps": 2148, "loss": 0.2221, "lr": 5.196120300846835e-07, "epoch": 2.6054405952104163, "percentage": 86.87, "elapsed_time": "4:19:14", "remaining_time": "0:39:10"}
1867
+ {"current_steps": 1867, "total_steps": 2148, "loss": 0.2491, "lr": 5.160107452051361e-07, "epoch": 2.6068356196233435, "percentage": 86.92, "elapsed_time": "4:19:20", "remaining_time": "0:39:02"}
1868
+ {"current_steps": 1868, "total_steps": 2148, "loss": 0.2021, "lr": 5.124213043830278e-07, "epoch": 2.6082306440362704, "percentage": 86.96, "elapsed_time": "4:19:26", "remaining_time": "0:38:53"}
1869
+ {"current_steps": 1869, "total_steps": 2148, "loss": 0.2141, "lr": 5.088437170995481e-07, "epoch": 2.6096256684491976, "percentage": 87.01, "elapsed_time": "4:19:33", "remaining_time": "0:38:44"}
1870
+ {"current_steps": 1870, "total_steps": 2148, "loss": 0.2257, "lr": 5.052779928045737e-07, "epoch": 2.611020692862125, "percentage": 87.06, "elapsed_time": "4:19:39", "remaining_time": "0:38:36"}
1871
+ {"current_steps": 1871, "total_steps": 2148, "loss": 0.2341, "lr": 5.01724140916649e-07, "epoch": 2.612415717275052, "percentage": 87.1, "elapsed_time": "4:19:48", "remaining_time": "0:38:27"}
1872
+ {"current_steps": 1872, "total_steps": 2148, "loss": 0.2512, "lr": 4.981821708229545e-07, "epoch": 2.6138107416879794, "percentage": 87.15, "elapsed_time": "4:19:54", "remaining_time": "0:38:19"}
1873
+ {"current_steps": 1873, "total_steps": 2148, "loss": 0.2182, "lr": 4.946520918792886e-07, "epoch": 2.6152057661009067, "percentage": 87.2, "elapsed_time": "4:20:00", "remaining_time": "0:38:10"}
1874
+ {"current_steps": 1874, "total_steps": 2148, "loss": 0.2533, "lr": 4.911339134100401e-07, "epoch": 2.616600790513834, "percentage": 87.24, "elapsed_time": "4:20:08", "remaining_time": "0:38:02"}
1875
+ {"current_steps": 1875, "total_steps": 2148, "loss": 0.239, "lr": 4.87627644708163e-07, "epoch": 2.6179958149267613, "percentage": 87.29, "elapsed_time": "4:20:17", "remaining_time": "0:37:53"}
1876
+ {"current_steps": 1876, "total_steps": 2148, "loss": 0.2441, "lr": 4.841332950351535e-07, "epoch": 2.6193908393396885, "percentage": 87.34, "elapsed_time": "4:20:25", "remaining_time": "0:37:45"}
1877
+ {"current_steps": 1877, "total_steps": 2148, "loss": 0.2365, "lr": 4.806508736210253e-07, "epoch": 2.620785863752616, "percentage": 87.38, "elapsed_time": "4:20:36", "remaining_time": "0:37:37"}
1878
+ {"current_steps": 1878, "total_steps": 2148, "loss": 0.2165, "lr": 4.771803896642812e-07, "epoch": 2.622180888165543, "percentage": 87.43, "elapsed_time": "4:20:50", "remaining_time": "0:37:30"}
1879
+ {"current_steps": 1879, "total_steps": 2148, "loss": 0.2542, "lr": 4.737218523318965e-07, "epoch": 2.6235759125784703, "percentage": 87.48, "elapsed_time": "4:20:56", "remaining_time": "0:37:21"}
1880
+ {"current_steps": 1880, "total_steps": 2148, "loss": 0.2212, "lr": 4.7027527075929e-07, "epoch": 2.6249709369913976, "percentage": 87.52, "elapsed_time": "4:21:03", "remaining_time": "0:37:12"}
1881
+ {"current_steps": 1881, "total_steps": 2148, "loss": 0.2363, "lr": 4.6684065405029677e-07, "epoch": 2.6263659614043244, "percentage": 87.57, "elapsed_time": "4:21:09", "remaining_time": "0:37:04"}
1882
+ {"current_steps": 1882, "total_steps": 2148, "loss": 0.2257, "lr": 4.6341801127715303e-07, "epoch": 2.6277609858172517, "percentage": 87.62, "elapsed_time": "4:21:16", "remaining_time": "0:36:55"}
1883
+ {"current_steps": 1883, "total_steps": 2148, "loss": 0.2529, "lr": 4.6000735148046316e-07, "epoch": 2.629156010230179, "percentage": 87.66, "elapsed_time": "4:21:27", "remaining_time": "0:36:47"}
1884
+ {"current_steps": 1884, "total_steps": 2148, "loss": 0.2275, "lr": 4.566086836691791e-07, "epoch": 2.6305510346431062, "percentage": 87.71, "elapsed_time": "4:21:34", "remaining_time": "0:36:39"}
1885
+ {"current_steps": 1885, "total_steps": 2148, "loss": 0.24, "lr": 4.532220168205798e-07, "epoch": 2.6319460590560335, "percentage": 87.76, "elapsed_time": "4:21:40", "remaining_time": "0:36:30"}
1886
+ {"current_steps": 1886, "total_steps": 2148, "loss": 0.2085, "lr": 4.498473598802444e-07, "epoch": 2.633341083468961, "percentage": 87.8, "elapsed_time": "4:21:50", "remaining_time": "0:36:22"}
1887
+ {"current_steps": 1887, "total_steps": 2148, "loss": 0.2322, "lr": 4.464847217620266e-07, "epoch": 2.634736107881888, "percentage": 87.85, "elapsed_time": "4:21:58", "remaining_time": "0:36:14"}
1888
+ {"current_steps": 1888, "total_steps": 2148, "loss": 0.2464, "lr": 4.4313411134803584e-07, "epoch": 2.636131132294815, "percentage": 87.9, "elapsed_time": "4:22:04", "remaining_time": "0:36:05"}
1889
+ {"current_steps": 1889, "total_steps": 2148, "loss": 0.2192, "lr": 4.397955374886104e-07, "epoch": 2.637526156707742, "percentage": 87.94, "elapsed_time": "4:22:17", "remaining_time": "0:35:57"}
1890
+ {"current_steps": 1890, "total_steps": 2148, "loss": 0.2369, "lr": 4.364690090022938e-07, "epoch": 2.6389211811206694, "percentage": 87.99, "elapsed_time": "4:22:26", "remaining_time": "0:35:49"}
1891
+ {"current_steps": 1891, "total_steps": 2148, "loss": 0.2322, "lr": 4.331545346758159e-07, "epoch": 2.6403162055335967, "percentage": 88.04, "elapsed_time": "4:22:40", "remaining_time": "0:35:41"}
1892
+ {"current_steps": 1892, "total_steps": 2148, "loss": 0.2121, "lr": 4.2985212326406456e-07, "epoch": 2.641711229946524, "percentage": 88.08, "elapsed_time": "4:22:47", "remaining_time": "0:35:33"}
1893
+ {"current_steps": 1893, "total_steps": 2148, "loss": 0.2134, "lr": 4.265617834900637e-07, "epoch": 2.6431062543594512, "percentage": 88.13, "elapsed_time": "4:22:58", "remaining_time": "0:35:25"}
1894
+ {"current_steps": 1894, "total_steps": 2148, "loss": 0.2035, "lr": 4.2328352404495346e-07, "epoch": 2.6445012787723785, "percentage": 88.18, "elapsed_time": "4:23:04", "remaining_time": "0:35:16"}
1895
+ {"current_steps": 1895, "total_steps": 2148, "loss": 0.2007, "lr": 4.2001735358796316e-07, "epoch": 2.6458963031853058, "percentage": 88.22, "elapsed_time": "4:23:12", "remaining_time": "0:35:08"}
1896
+ {"current_steps": 1896, "total_steps": 2148, "loss": 0.2022, "lr": 4.167632807463895e-07, "epoch": 2.647291327598233, "percentage": 88.27, "elapsed_time": "4:23:25", "remaining_time": "0:35:00"}
1897
+ {"current_steps": 1897, "total_steps": 2148, "loss": 0.2296, "lr": 4.135213141155769e-07, "epoch": 2.6486863520111603, "percentage": 88.31, "elapsed_time": "4:23:32", "remaining_time": "0:34:52"}
1898
+ {"current_steps": 1898, "total_steps": 2148, "loss": 0.2356, "lr": 4.1029146225889103e-07, "epoch": 2.6500813764240876, "percentage": 88.36, "elapsed_time": "4:23:39", "remaining_time": "0:34:43"}
1899
+ {"current_steps": 1899, "total_steps": 2148, "loss": 0.2321, "lr": 4.0707373370769634e-07, "epoch": 2.651476400837015, "percentage": 88.41, "elapsed_time": "4:23:46", "remaining_time": "0:34:35"}
1900
+ {"current_steps": 1900, "total_steps": 2148, "loss": 0.2363, "lr": 4.0386813696133564e-07, "epoch": 2.652871425249942, "percentage": 88.45, "elapsed_time": "4:23:52", "remaining_time": "0:34:26"}
1901
+ {"current_steps": 1901, "total_steps": 2148, "loss": 0.2194, "lr": 4.0067468048710756e-07, "epoch": 2.654266449662869, "percentage": 88.5, "elapsed_time": "4:24:00", "remaining_time": "0:34:18"}
1902
+ {"current_steps": 1902, "total_steps": 2148, "loss": 0.229, "lr": 3.974933727202412e-07, "epoch": 2.6556614740757962, "percentage": 88.55, "elapsed_time": "4:24:07", "remaining_time": "0:34:09"}
1903
+ {"current_steps": 1903, "total_steps": 2148, "loss": 0.2152, "lr": 3.943242220638777e-07, "epoch": 2.6570564984887235, "percentage": 88.59, "elapsed_time": "4:24:16", "remaining_time": "0:34:01"}
1904
+ {"current_steps": 1904, "total_steps": 2148, "loss": 0.2426, "lr": 3.911672368890462e-07, "epoch": 2.6584515229016508, "percentage": 88.64, "elapsed_time": "4:24:22", "remaining_time": "0:33:52"}
1905
+ {"current_steps": 1905, "total_steps": 2148, "loss": 0.2313, "lr": 3.8802242553464096e-07, "epoch": 2.659846547314578, "percentage": 88.69, "elapsed_time": "4:24:29", "remaining_time": "0:33:44"}
1906
+ {"current_steps": 1906, "total_steps": 2148, "loss": 0.2298, "lr": 3.8488979630739996e-07, "epoch": 2.6612415717275053, "percentage": 88.73, "elapsed_time": "4:24:40", "remaining_time": "0:33:36"}
1907
+ {"current_steps": 1907, "total_steps": 2148, "loss": 0.1858, "lr": 3.8176935748188425e-07, "epoch": 2.6626365961404326, "percentage": 88.78, "elapsed_time": "4:24:52", "remaining_time": "0:33:28"}
1908
+ {"current_steps": 1908, "total_steps": 2148, "loss": 0.207, "lr": 3.78661117300454e-07, "epoch": 2.66403162055336, "percentage": 88.83, "elapsed_time": "4:25:01", "remaining_time": "0:33:20"}
1909
+ {"current_steps": 1909, "total_steps": 2148, "loss": 0.2123, "lr": 3.755650839732489e-07, "epoch": 2.6654266449662867, "percentage": 88.87, "elapsed_time": "4:25:08", "remaining_time": "0:33:11"}
1910
+ {"current_steps": 1910, "total_steps": 2148, "loss": 0.2562, "lr": 3.7248126567816454e-07, "epoch": 2.666821669379214, "percentage": 88.92, "elapsed_time": "4:25:14", "remaining_time": "0:33:03"}
1911
+ {"current_steps": 1911, "total_steps": 2148, "loss": 0.2368, "lr": 3.694096705608319e-07, "epoch": 2.668216693792141, "percentage": 88.97, "elapsed_time": "4:25:24", "remaining_time": "0:32:54"}
1912
+ {"current_steps": 1912, "total_steps": 2148, "loss": 0.2218, "lr": 3.6635030673459413e-07, "epoch": 2.6696117182050685, "percentage": 89.01, "elapsed_time": "4:25:33", "remaining_time": "0:32:46"}
1913
+ {"current_steps": 1913, "total_steps": 2148, "loss": 0.2468, "lr": 3.6330318228049e-07, "epoch": 2.6710067426179958, "percentage": 89.06, "elapsed_time": "4:25:40", "remaining_time": "0:32:38"}
1914
+ {"current_steps": 1914, "total_steps": 2148, "loss": 0.2407, "lr": 3.6026830524722443e-07, "epoch": 2.672401767030923, "percentage": 89.11, "elapsed_time": "4:25:47", "remaining_time": "0:32:29"}
1915
+ {"current_steps": 1915, "total_steps": 2148, "loss": 0.2458, "lr": 3.572456836511551e-07, "epoch": 2.6737967914438503, "percentage": 89.15, "elapsed_time": "4:25:59", "remaining_time": "0:32:21"}
1916
+ {"current_steps": 1916, "total_steps": 2148, "loss": 0.2207, "lr": 3.5423532547626816e-07, "epoch": 2.6751918158567776, "percentage": 89.2, "elapsed_time": "4:26:07", "remaining_time": "0:32:13"}
1917
+ {"current_steps": 1917, "total_steps": 2148, "loss": 0.1981, "lr": 3.5123723867415527e-07, "epoch": 2.676586840269705, "percentage": 89.25, "elapsed_time": "4:26:17", "remaining_time": "0:32:05"}
1918
+ {"current_steps": 1918, "total_steps": 2148, "loss": 0.2194, "lr": 3.4825143116399454e-07, "epoch": 2.677981864682632, "percentage": 89.29, "elapsed_time": "4:26:24", "remaining_time": "0:31:56"}
1919
+ {"current_steps": 1919, "total_steps": 2148, "loss": 0.2209, "lr": 3.452779108325316e-07, "epoch": 2.6793768890955594, "percentage": 89.34, "elapsed_time": "4:26:30", "remaining_time": "0:31:48"}
1920
+ {"current_steps": 1920, "total_steps": 2148, "loss": 0.222, "lr": 3.4231668553405316e-07, "epoch": 2.6807719135084866, "percentage": 89.39, "elapsed_time": "4:26:36", "remaining_time": "0:31:39"}
1921
+ {"current_steps": 1921, "total_steps": 2148, "loss": 0.237, "lr": 3.39367763090373e-07, "epoch": 2.6821669379214135, "percentage": 89.43, "elapsed_time": "4:26:43", "remaining_time": "0:31:31"}
1922
+ {"current_steps": 1922, "total_steps": 2148, "loss": 0.238, "lr": 3.3643115129080695e-07, "epoch": 2.6835619623343407, "percentage": 89.48, "elapsed_time": "4:26:52", "remaining_time": "0:31:22"}
1923
+ {"current_steps": 1923, "total_steps": 2148, "loss": 0.2264, "lr": 3.3350685789215133e-07, "epoch": 2.684956986747268, "percentage": 89.53, "elapsed_time": "4:27:04", "remaining_time": "0:31:14"}
1924
+ {"current_steps": 1924, "total_steps": 2148, "loss": 0.2447, "lr": 3.3059489061866625e-07, "epoch": 2.6863520111601953, "percentage": 89.57, "elapsed_time": "4:27:12", "remaining_time": "0:31:06"}
1925
+ {"current_steps": 1925, "total_steps": 2148, "loss": 0.2521, "lr": 3.276952571620556e-07, "epoch": 2.6877470355731226, "percentage": 89.62, "elapsed_time": "4:27:24", "remaining_time": "0:30:58"}
1926
+ {"current_steps": 1926, "total_steps": 2148, "loss": 0.2302, "lr": 3.248079651814395e-07, "epoch": 2.68914205998605, "percentage": 89.66, "elapsed_time": "4:27:31", "remaining_time": "0:30:50"}
1927
+ {"current_steps": 1927, "total_steps": 2148, "loss": 0.1955, "lr": 3.2193302230334455e-07, "epoch": 2.690537084398977, "percentage": 89.71, "elapsed_time": "4:27:38", "remaining_time": "0:30:41"}
1928
+ {"current_steps": 1928, "total_steps": 2148, "loss": 0.2122, "lr": 3.190704361216751e-07, "epoch": 2.6919321088119044, "percentage": 89.76, "elapsed_time": "4:27:44", "remaining_time": "0:30:33"}
1929
+ {"current_steps": 1929, "total_steps": 2148, "loss": 0.266, "lr": 3.162202141976956e-07, "epoch": 2.693327133224831, "percentage": 89.8, "elapsed_time": "4:27:52", "remaining_time": "0:30:24"}
1930
+ {"current_steps": 1930, "total_steps": 2148, "loss": 0.2578, "lr": 3.133823640600137e-07, "epoch": 2.6947221576377585, "percentage": 89.85, "elapsed_time": "4:27:59", "remaining_time": "0:30:16"}
1931
+ {"current_steps": 1931, "total_steps": 2148, "loss": 0.2494, "lr": 3.105568932045577e-07, "epoch": 2.6961171820506857, "percentage": 89.9, "elapsed_time": "4:28:07", "remaining_time": "0:30:07"}
1932
+ {"current_steps": 1932, "total_steps": 2148, "loss": 0.2233, "lr": 3.077438090945573e-07, "epoch": 2.697512206463613, "percentage": 89.94, "elapsed_time": "4:28:13", "remaining_time": "0:29:59"}
1933
+ {"current_steps": 1933, "total_steps": 2148, "loss": 0.2472, "lr": 3.0494311916052234e-07, "epoch": 2.6989072308765403, "percentage": 89.99, "elapsed_time": "4:28:21", "remaining_time": "0:29:50"}
1934
+ {"current_steps": 1934, "total_steps": 2148, "loss": 0.2454, "lr": 3.021548308002248e-07, "epoch": 2.7003022552894675, "percentage": 90.04, "elapsed_time": "4:28:32", "remaining_time": "0:29:42"}
1935
+ {"current_steps": 1935, "total_steps": 2148, "loss": 0.2334, "lr": 2.9937895137868046e-07, "epoch": 2.701697279702395, "percentage": 90.08, "elapsed_time": "4:28:38", "remaining_time": "0:29:34"}
1936
+ {"current_steps": 1936, "total_steps": 2148, "loss": 0.2145, "lr": 2.9661548822812636e-07, "epoch": 2.703092304115322, "percentage": 90.13, "elapsed_time": "4:28:46", "remaining_time": "0:29:25"}
1937
+ {"current_steps": 1937, "total_steps": 2148, "loss": 0.2533, "lr": 2.9386444864800355e-07, "epoch": 2.7044873285282494, "percentage": 90.18, "elapsed_time": "4:28:52", "remaining_time": "0:29:17"}
1938
+ {"current_steps": 1938, "total_steps": 2148, "loss": 0.2681, "lr": 2.911258399049394e-07, "epoch": 2.7058823529411766, "percentage": 90.22, "elapsed_time": "4:29:00", "remaining_time": "0:29:08"}
1939
+ {"current_steps": 1939, "total_steps": 2148, "loss": 0.2283, "lr": 2.8839966923272286e-07, "epoch": 2.707277377354104, "percentage": 90.27, "elapsed_time": "4:29:07", "remaining_time": "0:29:00"}
1940
+ {"current_steps": 1940, "total_steps": 2148, "loss": 0.2516, "lr": 2.8568594383229067e-07, "epoch": 2.708672401767031, "percentage": 90.32, "elapsed_time": "4:29:15", "remaining_time": "0:28:52"}
1941
+ {"current_steps": 1941, "total_steps": 2148, "loss": 0.2544, "lr": 2.8298467087170655e-07, "epoch": 2.710067426179958, "percentage": 90.36, "elapsed_time": "4:29:22", "remaining_time": "0:28:43"}
1942
+ {"current_steps": 1942, "total_steps": 2148, "loss": 0.2399, "lr": 2.8029585748614196e-07, "epoch": 2.7114624505928853, "percentage": 90.41, "elapsed_time": "4:29:28", "remaining_time": "0:28:35"}
1943
+ {"current_steps": 1943, "total_steps": 2148, "loss": 0.242, "lr": 2.7761951077785676e-07, "epoch": 2.7128574750058125, "percentage": 90.46, "elapsed_time": "4:29:35", "remaining_time": "0:28:26"}
1944
+ {"current_steps": 1944, "total_steps": 2148, "loss": 0.2226, "lr": 2.749556378161833e-07, "epoch": 2.71425249941874, "percentage": 90.5, "elapsed_time": "4:29:47", "remaining_time": "0:28:18"}
1945
+ {"current_steps": 1945, "total_steps": 2148, "loss": 0.2224, "lr": 2.723042456375036e-07, "epoch": 2.715647523831667, "percentage": 90.55, "elapsed_time": "4:29:54", "remaining_time": "0:28:10"}
1946
+ {"current_steps": 1946, "total_steps": 2148, "loss": 0.2256, "lr": 2.696653412452327e-07, "epoch": 2.7170425482445943, "percentage": 90.6, "elapsed_time": "4:30:00", "remaining_time": "0:28:01"}
1947
+ {"current_steps": 1947, "total_steps": 2148, "loss": 0.2318, "lr": 2.6703893160980266e-07, "epoch": 2.7184375726575216, "percentage": 90.64, "elapsed_time": "4:30:07", "remaining_time": "0:27:53"}
1948
+ {"current_steps": 1948, "total_steps": 2148, "loss": 0.2466, "lr": 2.6442502366863854e-07, "epoch": 2.719832597070449, "percentage": 90.69, "elapsed_time": "4:30:13", "remaining_time": "0:27:44"}
1949
+ {"current_steps": 1949, "total_steps": 2148, "loss": 0.2324, "lr": 2.618236243261452e-07, "epoch": 2.7212276214833757, "percentage": 90.74, "elapsed_time": "4:30:20", "remaining_time": "0:27:36"}
1950
+ {"current_steps": 1950, "total_steps": 2148, "loss": 0.2329, "lr": 2.592347404536888e-07, "epoch": 2.722622645896303, "percentage": 90.78, "elapsed_time": "4:30:27", "remaining_time": "0:27:27"}
1951
+ {"current_steps": 1951, "total_steps": 2148, "loss": 0.2358, "lr": 2.566583788895721e-07, "epoch": 2.7240176703092303, "percentage": 90.83, "elapsed_time": "4:30:33", "remaining_time": "0:27:19"}
1952
+ {"current_steps": 1952, "total_steps": 2148, "loss": 0.2383, "lr": 2.5409454643902543e-07, "epoch": 2.7254126947221575, "percentage": 90.88, "elapsed_time": "4:30:39", "remaining_time": "0:27:10"}
1953
+ {"current_steps": 1953, "total_steps": 2148, "loss": 0.2428, "lr": 2.5154324987418434e-07, "epoch": 2.726807719135085, "percentage": 90.92, "elapsed_time": "4:30:45", "remaining_time": "0:27:02"}
1954
+ {"current_steps": 1954, "total_steps": 2148, "loss": 0.2235, "lr": 2.4900449593406984e-07, "epoch": 2.728202743548012, "percentage": 90.97, "elapsed_time": "4:30:52", "remaining_time": "0:26:53"}
1955
+ {"current_steps": 1955, "total_steps": 2148, "loss": 0.2263, "lr": 2.4647829132457446e-07, "epoch": 2.7295977679609393, "percentage": 91.01, "elapsed_time": "4:31:02", "remaining_time": "0:26:45"}
1956
+ {"current_steps": 1956, "total_steps": 2148, "loss": 0.2199, "lr": 2.439646427184428e-07, "epoch": 2.7309927923738666, "percentage": 91.06, "elapsed_time": "4:31:13", "remaining_time": "0:26:37"}
1957
+ {"current_steps": 1957, "total_steps": 2148, "loss": 0.2324, "lr": 2.4146355675525145e-07, "epoch": 2.732387816786794, "percentage": 91.11, "elapsed_time": "4:31:20", "remaining_time": "0:26:28"}
1958
+ {"current_steps": 1958, "total_steps": 2148, "loss": 0.2493, "lr": 2.389750400413965e-07, "epoch": 2.733782841199721, "percentage": 91.15, "elapsed_time": "4:31:29", "remaining_time": "0:26:20"}
1959
+ {"current_steps": 1959, "total_steps": 2148, "loss": 0.2276, "lr": 2.364990991500743e-07, "epoch": 2.7351778656126484, "percentage": 91.2, "elapsed_time": "4:31:38", "remaining_time": "0:26:12"}
1960
+ {"current_steps": 1960, "total_steps": 2148, "loss": 0.2066, "lr": 2.340357406212601e-07, "epoch": 2.7365728900255757, "percentage": 91.25, "elapsed_time": "4:31:44", "remaining_time": "0:26:03"}
1961
+ {"current_steps": 1961, "total_steps": 2148, "loss": 0.1987, "lr": 2.315849709616963e-07, "epoch": 2.7379679144385025, "percentage": 91.29, "elapsed_time": "4:31:50", "remaining_time": "0:25:55"}
1962
+ {"current_steps": 1962, "total_steps": 2148, "loss": 0.1947, "lr": 2.2914679664487237e-07, "epoch": 2.73936293885143, "percentage": 91.34, "elapsed_time": "4:31:58", "remaining_time": "0:25:47"}
1963
+ {"current_steps": 1963, "total_steps": 2148, "loss": 0.2357, "lr": 2.2672122411100727e-07, "epoch": 2.740757963264357, "percentage": 91.39, "elapsed_time": "4:32:04", "remaining_time": "0:25:38"}
1964
+ {"current_steps": 1964, "total_steps": 2148, "loss": 0.2226, "lr": 2.2430825976703485e-07, "epoch": 2.7421529876772843, "percentage": 91.43, "elapsed_time": "4:32:16", "remaining_time": "0:25:30"}
1965
+ {"current_steps": 1965, "total_steps": 2148, "loss": 0.2651, "lr": 2.2190790998658561e-07, "epoch": 2.7435480120902116, "percentage": 91.48, "elapsed_time": "4:32:23", "remaining_time": "0:25:22"}
1966
+ {"current_steps": 1966, "total_steps": 2148, "loss": 0.2186, "lr": 2.1952018110996843e-07, "epoch": 2.744943036503139, "percentage": 91.53, "elapsed_time": "4:32:29", "remaining_time": "0:25:13"}
1967
+ {"current_steps": 1967, "total_steps": 2148, "loss": 0.2523, "lr": 2.1714507944415708e-07, "epoch": 2.746338060916066, "percentage": 91.57, "elapsed_time": "4:32:39", "remaining_time": "0:25:05"}
1968
+ {"current_steps": 1968, "total_steps": 2148, "loss": 0.2196, "lr": 2.1478261126276989e-07, "epoch": 2.7477330853289934, "percentage": 91.62, "elapsed_time": "4:32:52", "remaining_time": "0:24:57"}
1969
+ {"current_steps": 1969, "total_steps": 2148, "loss": 0.2388, "lr": 2.1243278280605517e-07, "epoch": 2.7491281097419202, "percentage": 91.67, "elapsed_time": "4:33:02", "remaining_time": "0:24:49"}
1970
+ {"current_steps": 1970, "total_steps": 2148, "loss": 0.2187, "lr": 2.1009560028087627e-07, "epoch": 2.7505231341548475, "percentage": 91.71, "elapsed_time": "4:33:11", "remaining_time": "0:24:41"}
1971
+ {"current_steps": 1971, "total_steps": 2148, "loss": 0.2341, "lr": 2.0777106986069162e-07, "epoch": 2.7519181585677748, "percentage": 91.76, "elapsed_time": "4:33:21", "remaining_time": "0:24:32"}
1972
+ {"current_steps": 1972, "total_steps": 2148, "loss": 0.2139, "lr": 2.0545919768554078e-07, "epoch": 2.753313182980702, "percentage": 91.81, "elapsed_time": "4:33:28", "remaining_time": "0:24:24"}
1973
+ {"current_steps": 1973, "total_steps": 2148, "loss": 0.2503, "lr": 2.0315998986202902e-07, "epoch": 2.7547082073936293, "percentage": 91.85, "elapsed_time": "4:33:36", "remaining_time": "0:24:16"}
1974
+ {"current_steps": 1974, "total_steps": 2148, "loss": 0.2273, "lr": 2.0087345246330714e-07, "epoch": 2.7561032318065566, "percentage": 91.9, "elapsed_time": "4:33:43", "remaining_time": "0:24:07"}
1975
+ {"current_steps": 1975, "total_steps": 2148, "loss": 0.2365, "lr": 1.985995915290595e-07, "epoch": 2.757498256219484, "percentage": 91.95, "elapsed_time": "4:33:50", "remaining_time": "0:23:59"}
1976
+ {"current_steps": 1976, "total_steps": 2148, "loss": 0.2116, "lr": 1.9633841306548717e-07, "epoch": 2.758893280632411, "percentage": 91.99, "elapsed_time": "4:33:58", "remaining_time": "0:23:50"}
1977
+ {"current_steps": 1977, "total_steps": 2148, "loss": 0.2496, "lr": 1.9408992304529252e-07, "epoch": 2.7602883050453384, "percentage": 92.04, "elapsed_time": "4:34:14", "remaining_time": "0:23:43"}
1978
+ {"current_steps": 1978, "total_steps": 2148, "loss": 0.1972, "lr": 1.9185412740765962e-07, "epoch": 2.7616833294582657, "percentage": 92.09, "elapsed_time": "4:34:25", "remaining_time": "0:23:35"}
1979
+ {"current_steps": 1979, "total_steps": 2148, "loss": 0.223, "lr": 1.8963103205824397e-07, "epoch": 2.763078353871193, "percentage": 92.13, "elapsed_time": "4:34:31", "remaining_time": "0:23:26"}
1980
+ {"current_steps": 1980, "total_steps": 2148, "loss": 0.2364, "lr": 1.8742064286915329e-07, "epoch": 2.76447337828412, "percentage": 92.18, "elapsed_time": "4:34:38", "remaining_time": "0:23:18"}
1981
+ {"current_steps": 1981, "total_steps": 2148, "loss": 0.249, "lr": 1.8522296567893282e-07, "epoch": 2.765868402697047, "percentage": 92.23, "elapsed_time": "4:34:46", "remaining_time": "0:23:09"}
1982
+ {"current_steps": 1982, "total_steps": 2148, "loss": 0.2226, "lr": 1.830380062925513e-07, "epoch": 2.7672634271099743, "percentage": 92.27, "elapsed_time": "4:34:52", "remaining_time": "0:23:01"}
1983
+ {"current_steps": 1983, "total_steps": 2148, "loss": 0.2366, "lr": 1.8086577048138432e-07, "epoch": 2.7686584515229016, "percentage": 92.32, "elapsed_time": "4:34:58", "remaining_time": "0:22:52"}
1984
+ {"current_steps": 1984, "total_steps": 2148, "loss": 0.2195, "lr": 1.787062639831988e-07, "epoch": 2.770053475935829, "percentage": 92.36, "elapsed_time": "4:35:05", "remaining_time": "0:22:44"}
1985
+ {"current_steps": 1985, "total_steps": 2148, "loss": 0.2158, "lr": 1.7655949250213743e-07, "epoch": 2.771448500348756, "percentage": 92.41, "elapsed_time": "4:35:13", "remaining_time": "0:22:35"}
1986
+ {"current_steps": 1986, "total_steps": 2148, "loss": 0.2227, "lr": 1.7442546170870654e-07, "epoch": 2.7728435247616834, "percentage": 92.46, "elapsed_time": "4:35:20", "remaining_time": "0:22:27"}
1987
+ {"current_steps": 1987, "total_steps": 2148, "loss": 0.2392, "lr": 1.7230417723975766e-07, "epoch": 2.7742385491746107, "percentage": 92.5, "elapsed_time": "4:35:30", "remaining_time": "0:22:19"}
1988
+ {"current_steps": 1988, "total_steps": 2148, "loss": 0.2143, "lr": 1.7019564469847372e-07, "epoch": 2.775633573587538, "percentage": 92.55, "elapsed_time": "4:35:40", "remaining_time": "0:22:11"}
1989
+ {"current_steps": 1989, "total_steps": 2148, "loss": 0.2052, "lr": 1.6809986965435675e-07, "epoch": 2.7770285980004648, "percentage": 92.6, "elapsed_time": "4:35:46", "remaining_time": "0:22:02"}
1990
+ {"current_steps": 1990, "total_steps": 2148, "loss": 0.2435, "lr": 1.660168576432092e-07, "epoch": 2.778423622413392, "percentage": 92.64, "elapsed_time": "4:35:57", "remaining_time": "0:21:54"}
1991
+ {"current_steps": 1991, "total_steps": 2148, "loss": 0.2229, "lr": 1.6394661416711977e-07, "epoch": 2.7798186468263193, "percentage": 92.69, "elapsed_time": "4:36:07", "remaining_time": "0:21:46"}
1992
+ {"current_steps": 1992, "total_steps": 2148, "loss": 0.2236, "lr": 1.6188914469445372e-07, "epoch": 2.7812136712392466, "percentage": 92.74, "elapsed_time": "4:36:15", "remaining_time": "0:21:38"}
1993
+ {"current_steps": 1993, "total_steps": 2148, "loss": 0.2337, "lr": 1.5984445465983156e-07, "epoch": 2.782608695652174, "percentage": 92.78, "elapsed_time": "4:36:23", "remaining_time": "0:21:29"}
1994
+ {"current_steps": 1994, "total_steps": 2148, "loss": 0.2174, "lr": 1.5781254946412029e-07, "epoch": 2.784003720065101, "percentage": 92.83, "elapsed_time": "4:36:29", "remaining_time": "0:21:21"}
1995
+ {"current_steps": 1995, "total_steps": 2148, "loss": 0.216, "lr": 1.5579343447441663e-07, "epoch": 2.7853987444780284, "percentage": 92.88, "elapsed_time": "4:36:40", "remaining_time": "0:21:13"}
1996
+ {"current_steps": 1996, "total_steps": 2148, "loss": 0.192, "lr": 1.5378711502403164e-07, "epoch": 2.7867937688909556, "percentage": 92.92, "elapsed_time": "4:36:46", "remaining_time": "0:21:04"}
1997
+ {"current_steps": 1997, "total_steps": 2148, "loss": 0.2368, "lr": 1.5179359641247948e-07, "epoch": 2.788188793303883, "percentage": 92.97, "elapsed_time": "4:36:53", "remaining_time": "0:20:56"}
1998
+ {"current_steps": 1998, "total_steps": 2148, "loss": 0.2447, "lr": 1.4981288390546188e-07, "epoch": 2.78958381771681, "percentage": 93.02, "elapsed_time": "4:37:01", "remaining_time": "0:20:47"}
1999
+ {"current_steps": 1999, "total_steps": 2148, "loss": 0.2278, "lr": 1.4784498273485436e-07, "epoch": 2.7909788421297375, "percentage": 93.06, "elapsed_time": "4:37:11", "remaining_time": "0:20:39"}
2000
+ {"current_steps": 2000, "total_steps": 2148, "loss": 0.2392, "lr": 1.458898980986917e-07, "epoch": 2.7923738665426647, "percentage": 93.11, "elapsed_time": "4:37:21", "remaining_time": "0:20:31"}
2001
+ {"current_steps": 2001, "total_steps": 2148, "loss": 0.2309, "lr": 1.4394763516115573e-07, "epoch": 2.793768890955592, "percentage": 93.16, "elapsed_time": "4:39:10", "remaining_time": "0:20:30"}
2002
+ {"current_steps": 2002, "total_steps": 2148, "loss": 0.2307, "lr": 1.4201819905256043e-07, "epoch": 2.795163915368519, "percentage": 93.2, "elapsed_time": "4:39:20", "remaining_time": "0:20:22"}
2003
+ {"current_steps": 2003, "total_steps": 2148, "loss": 0.2509, "lr": 1.4010159486933906e-07, "epoch": 2.796558939781446, "percentage": 93.25, "elapsed_time": "4:39:26", "remaining_time": "0:20:13"}
2004
+ {"current_steps": 2004, "total_steps": 2148, "loss": 0.2195, "lr": 1.3819782767403034e-07, "epoch": 2.7979539641943734, "percentage": 93.3, "elapsed_time": "4:39:35", "remaining_time": "0:20:05"}
2005
+ {"current_steps": 2005, "total_steps": 2148, "loss": 0.2365, "lr": 1.363069024952668e-07, "epoch": 2.7993489886073006, "percentage": 93.34, "elapsed_time": "4:39:43", "remaining_time": "0:19:57"}
2006
+ {"current_steps": 2006, "total_steps": 2148, "loss": 0.2437, "lr": 1.344288243277575e-07, "epoch": 2.800744013020228, "percentage": 93.39, "elapsed_time": "4:39:50", "remaining_time": "0:19:48"}
2007
+ {"current_steps": 2007, "total_steps": 2148, "loss": 0.2238, "lr": 1.3256359813227758e-07, "epoch": 2.802139037433155, "percentage": 93.44, "elapsed_time": "4:39:59", "remaining_time": "0:19:40"}
2008
+ {"current_steps": 2008, "total_steps": 2148, "loss": 0.2472, "lr": 1.3071122883565657e-07, "epoch": 2.8035340618460824, "percentage": 93.48, "elapsed_time": "4:40:06", "remaining_time": "0:19:31"}
2009
+ {"current_steps": 2009, "total_steps": 2148, "loss": 0.2465, "lr": 1.288717213307622e-07, "epoch": 2.8049290862590093, "percentage": 93.53, "elapsed_time": "4:40:13", "remaining_time": "0:19:23"}
2010
+ {"current_steps": 2010, "total_steps": 2148, "loss": 0.2487, "lr": 1.2704508047649e-07, "epoch": 2.8063241106719365, "percentage": 93.58, "elapsed_time": "4:40:19", "remaining_time": "0:19:14"}
2011
+ {"current_steps": 2011, "total_steps": 2148, "loss": 0.2023, "lr": 1.2523131109774822e-07, "epoch": 2.807719135084864, "percentage": 93.62, "elapsed_time": "4:40:30", "remaining_time": "0:19:06"}
2012
+ {"current_steps": 2012, "total_steps": 2148, "loss": 0.2171, "lr": 1.234304179854473e-07, "epoch": 2.809114159497791, "percentage": 93.67, "elapsed_time": "4:40:39", "remaining_time": "0:18:58"}
2013
+ {"current_steps": 2013, "total_steps": 2148, "loss": 0.2289, "lr": 1.2164240589648436e-07, "epoch": 2.8105091839107184, "percentage": 93.72, "elapsed_time": "4:40:51", "remaining_time": "0:18:50"}
2014
+ {"current_steps": 2014, "total_steps": 2148, "loss": 0.2267, "lr": 1.1986727955373588e-07, "epoch": 2.8119042083236456, "percentage": 93.76, "elapsed_time": "4:41:03", "remaining_time": "0:18:42"}
2015
+ {"current_steps": 2015, "total_steps": 2148, "loss": 0.2363, "lr": 1.1810504364603737e-07, "epoch": 2.813299232736573, "percentage": 93.81, "elapsed_time": "4:41:10", "remaining_time": "0:18:33"}
2016
+ {"current_steps": 2016, "total_steps": 2148, "loss": 0.2097, "lr": 1.163557028281792e-07, "epoch": 2.8146942571495, "percentage": 93.85, "elapsed_time": "4:41:17", "remaining_time": "0:18:25"}