Training in progress, epoch 4
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:88e49552a7f62898b7dab4d18292237d34d7e21794235451605c9fa021c45e04
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56ff937e8094adec3036fcdfc26c45b77739d63a0d2281e391a2dc6b81ebed7a
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:825b3042659a01bf07eb5f22fb7da4023957a2c12cab4fd84b9723156f4972c2
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b8b151ca877becf50964b12ccba8679aebe696d059fd62300f4d84c74eb373b7
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -938,3 +938,234 @@
|
|
| 938 |
{"current_steps": 938, "total_steps": 1170, "loss": 0.182, "lr": 4.6026748657946226e-06, "epoch": 4.004264392324094, "percentage": 80.17, "elapsed_time": "10:49:12", "remaining_time": "2:40:34"}
|
| 939 |
{"current_steps": 939, "total_steps": 1170, "loss": 0.1878, "lr": 4.5646621393177e-06, "epoch": 4.008528784648187, "percentage": 80.26, "elapsed_time": "10:49:59", "remaining_time": "2:39:54"}
|
| 940 |
{"current_steps": 940, "total_steps": 1170, "loss": 0.1827, "lr": 4.5267868040104765e-06, "epoch": 4.0127931769722816, "percentage": 80.34, "elapsed_time": "10:50:37", "remaining_time": "2:39:11"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 938 |
{"current_steps": 938, "total_steps": 1170, "loss": 0.182, "lr": 4.6026748657946226e-06, "epoch": 4.004264392324094, "percentage": 80.17, "elapsed_time": "10:49:12", "remaining_time": "2:40:34"}
|
| 939 |
{"current_steps": 939, "total_steps": 1170, "loss": 0.1878, "lr": 4.5646621393177e-06, "epoch": 4.008528784648187, "percentage": 80.26, "elapsed_time": "10:49:59", "remaining_time": "2:39:54"}
|
| 940 |
{"current_steps": 940, "total_steps": 1170, "loss": 0.1827, "lr": 4.5267868040104765e-06, "epoch": 4.0127931769722816, "percentage": 80.34, "elapsed_time": "10:50:37", "remaining_time": "2:39:11"}
|
| 941 |
+
{"current_steps": 941, "total_steps": 1170, "loss": 0.1759, "lr": 4.489049197004323e-06, "epoch": 4.017057569296376, "percentage": 80.43, "elapsed_time": "10:51:15", "remaining_time": "2:38:29"}
|
| 942 |
+
{"current_steps": 942, "total_steps": 1170, "loss": 0.1906, "lr": 4.451449654204685e-06, "epoch": 4.021321961620469, "percentage": 80.51, "elapsed_time": "10:51:58", "remaining_time": "2:37:48"}
|
| 943 |
+
{"current_steps": 943, "total_steps": 1170, "loss": 0.1764, "lr": 4.413988510288072e-06, "epoch": 4.025586353944563, "percentage": 80.6, "elapsed_time": "10:52:40", "remaining_time": "2:37:06"}
|
| 944 |
+
{"current_steps": 944, "total_steps": 1170, "loss": 0.177, "lr": 4.376666098699112e-06, "epoch": 4.029850746268656, "percentage": 80.68, "elapsed_time": "10:53:22", "remaining_time": "2:36:25"}
|
| 945 |
+
{"current_steps": 945, "total_steps": 1170, "loss": 0.1705, "lr": 4.339482751647557e-06, "epoch": 4.0341151385927505, "percentage": 80.77, "elapsed_time": "10:54:06", "remaining_time": "2:35:44"}
|
| 946 |
+
{"current_steps": 946, "total_steps": 1170, "loss": 0.188, "lr": 4.302438800105335e-06, "epoch": 4.038379530916845, "percentage": 80.85, "elapsed_time": "10:54:46", "remaining_time": "2:35:02"}
|
| 947 |
+
{"current_steps": 947, "total_steps": 1170, "loss": 0.1986, "lr": 4.265534573803607e-06, "epoch": 4.042643923240938, "percentage": 80.94, "elapsed_time": "10:55:23", "remaining_time": "2:34:19"}
|
| 948 |
+
{"current_steps": 948, "total_steps": 1170, "loss": 0.1807, "lr": 4.228770401229824e-06, "epoch": 4.046908315565032, "percentage": 81.03, "elapsed_time": "10:56:06", "remaining_time": "2:33:38"}
|
| 949 |
+
{"current_steps": 949, "total_steps": 1170, "loss": 0.1644, "lr": 4.1921466096248164e-06, "epoch": 4.051172707889126, "percentage": 81.11, "elapsed_time": "10:56:45", "remaining_time": "2:32:56"}
|
| 950 |
+
{"current_steps": 950, "total_steps": 1170, "loss": 0.1818, "lr": 4.155663524979854e-06, "epoch": 4.0554371002132195, "percentage": 81.2, "elapsed_time": "10:57:21", "remaining_time": "2:32:13"}
|
| 951 |
+
{"current_steps": 951, "total_steps": 1170, "loss": 0.1853, "lr": 4.119321472033779e-06, "epoch": 4.059701492537314, "percentage": 81.28, "elapsed_time": "10:58:00", "remaining_time": "2:31:31"}
|
| 952 |
+
{"current_steps": 952, "total_steps": 1170, "loss": 0.1892, "lr": 4.083120774270095e-06, "epoch": 4.063965884861407, "percentage": 81.37, "elapsed_time": "10:58:44", "remaining_time": "2:30:50"}
|
| 953 |
+
{"current_steps": 953, "total_steps": 1170, "loss": 0.1862, "lr": 4.04706175391409e-06, "epoch": 4.068230277185501, "percentage": 81.45, "elapsed_time": "10:59:26", "remaining_time": "2:30:09"}
|
| 954 |
+
{"current_steps": 954, "total_steps": 1170, "loss": 0.1635, "lr": 4.011144731929981e-06, "epoch": 4.072494669509595, "percentage": 81.54, "elapsed_time": "11:00:08", "remaining_time": "2:29:27"}
|
| 955 |
+
{"current_steps": 955, "total_steps": 1170, "loss": 0.195, "lr": 3.975370028018022e-06, "epoch": 4.076759061833688, "percentage": 81.62, "elapsed_time": "11:00:52", "remaining_time": "2:28:47"}
|
| 956 |
+
{"current_steps": 956, "total_steps": 1170, "loss": 0.2031, "lr": 3.9397379606117045e-06, "epoch": 4.081023454157783, "percentage": 81.71, "elapsed_time": "11:01:36", "remaining_time": "2:28:05"}
|
| 957 |
+
{"current_steps": 957, "total_steps": 1170, "loss": 0.2033, "lr": 3.904248846874894e-06, "epoch": 4.085287846481877, "percentage": 81.79, "elapsed_time": "11:02:16", "remaining_time": "2:27:24"}
|
| 958 |
+
{"current_steps": 958, "total_steps": 1170, "loss": 0.1836, "lr": 3.868903002699014e-06, "epoch": 4.08955223880597, "percentage": 81.88, "elapsed_time": "11:02:59", "remaining_time": "2:26:42"}
|
| 959 |
+
{"current_steps": 959, "total_steps": 1170, "loss": 0.1682, "lr": 3.833700742700237e-06, "epoch": 4.093816631130064, "percentage": 81.97, "elapsed_time": "11:03:38", "remaining_time": "2:26:00"}
|
| 960 |
+
{"current_steps": 960, "total_steps": 1170, "loss": 0.1829, "lr": 3.7986423802166705e-06, "epoch": 4.098081023454157, "percentage": 82.05, "elapsed_time": "11:04:17", "remaining_time": "2:25:18"}
|
| 961 |
+
{"current_steps": 961, "total_steps": 1170, "loss": 0.1881, "lr": 3.7637282273055918e-06, "epoch": 4.1023454157782515, "percentage": 82.14, "elapsed_time": "11:04:58", "remaining_time": "2:24:37"}
|
| 962 |
+
{"current_steps": 962, "total_steps": 1170, "loss": 0.1681, "lr": 3.7289585947406504e-06, "epoch": 4.106609808102346, "percentage": 82.22, "elapsed_time": "11:05:42", "remaining_time": "2:23:56"}
|
| 963 |
+
{"current_steps": 963, "total_steps": 1170, "loss": 0.1707, "lr": 3.694333792009115e-06, "epoch": 4.110874200426439, "percentage": 82.31, "elapsed_time": "11:06:23", "remaining_time": "2:23:14"}
|
| 964 |
+
{"current_steps": 964, "total_steps": 1170, "loss": 0.2017, "lr": 3.6598541273091035e-06, "epoch": 4.115138592750533, "percentage": 82.39, "elapsed_time": "11:07:02", "remaining_time": "2:22:32"}
|
| 965 |
+
{"current_steps": 965, "total_steps": 1170, "loss": 0.1742, "lr": 3.6255199075468595e-06, "epoch": 4.119402985074627, "percentage": 82.48, "elapsed_time": "11:07:47", "remaining_time": "2:21:51"}
|
| 966 |
+
{"current_steps": 966, "total_steps": 1170, "loss": 0.1903, "lr": 3.5913314383339937e-06, "epoch": 4.1236673773987205, "percentage": 82.56, "elapsed_time": "11:08:32", "remaining_time": "2:21:11"}
|
| 967 |
+
{"current_steps": 967, "total_steps": 1170, "loss": 0.19, "lr": 3.5572890239847934e-06, "epoch": 4.127931769722815, "percentage": 82.65, "elapsed_time": "11:09:15", "remaining_time": "2:20:29"}
|
| 968 |
+
{"current_steps": 968, "total_steps": 1170, "loss": 0.1668, "lr": 3.5233929675134993e-06, "epoch": 4.132196162046908, "percentage": 82.74, "elapsed_time": "11:09:58", "remaining_time": "2:19:48"}
|
| 969 |
+
{"current_steps": 969, "total_steps": 1170, "loss": 0.1792, "lr": 3.4896435706316e-06, "epoch": 4.136460554371002, "percentage": 82.82, "elapsed_time": "11:10:31", "remaining_time": "2:19:05"}
|
| 970 |
+
{"current_steps": 970, "total_steps": 1170, "loss": 0.1859, "lr": 3.456041133745163e-06, "epoch": 4.140724946695096, "percentage": 82.91, "elapsed_time": "11:11:15", "remaining_time": "2:18:24"}
|
| 971 |
+
{"current_steps": 971, "total_steps": 1170, "loss": 0.1943, "lr": 3.4225859559521536e-06, "epoch": 4.144989339019189, "percentage": 82.99, "elapsed_time": "11:11:59", "remaining_time": "2:17:43"}
|
| 972 |
+
{"current_steps": 972, "total_steps": 1170, "loss": 0.1804, "lr": 3.3892783350397675e-06, "epoch": 4.149253731343284, "percentage": 83.08, "elapsed_time": "11:12:41", "remaining_time": "2:17:01"}
|
| 973 |
+
{"current_steps": 973, "total_steps": 1170, "loss": 0.1875, "lr": 3.356118567481785e-06, "epoch": 4.153518123667378, "percentage": 83.16, "elapsed_time": "11:13:23", "remaining_time": "2:16:20"}
|
| 974 |
+
{"current_steps": 974, "total_steps": 1170, "loss": 0.1614, "lr": 3.3231069484359367e-06, "epoch": 4.157782515991471, "percentage": 83.25, "elapsed_time": "11:13:54", "remaining_time": "2:15:36"}
|
| 975 |
+
{"current_steps": 975, "total_steps": 1170, "loss": 0.2, "lr": 3.290243771741275e-06, "epoch": 4.162046908315565, "percentage": 83.33, "elapsed_time": "11:14:38", "remaining_time": "2:14:55"}
|
| 976 |
+
{"current_steps": 976, "total_steps": 1170, "loss": 0.177, "lr": 3.2575293299155343e-06, "epoch": 4.166311300639659, "percentage": 83.42, "elapsed_time": "11:15:15", "remaining_time": "2:14:13"}
|
| 977 |
+
{"current_steps": 977, "total_steps": 1170, "loss": 0.1761, "lr": 3.2249639141525724e-06, "epoch": 4.1705756929637525, "percentage": 83.5, "elapsed_time": "11:15:54", "remaining_time": "2:13:31"}
|
| 978 |
+
{"current_steps": 978, "total_steps": 1170, "loss": 0.1652, "lr": 3.1925478143197418e-06, "epoch": 4.174840085287847, "percentage": 83.59, "elapsed_time": "11:16:30", "remaining_time": "2:12:48"}
|
| 979 |
+
{"current_steps": 979, "total_steps": 1170, "loss": 0.182, "lr": 3.160281318955325e-06, "epoch": 4.17910447761194, "percentage": 83.68, "elapsed_time": "11:17:14", "remaining_time": "2:12:07"}
|
| 980 |
+
{"current_steps": 980, "total_steps": 1170, "loss": 0.1783, "lr": 3.1281647152659687e-06, "epoch": 4.183368869936034, "percentage": 83.76, "elapsed_time": "11:17:58", "remaining_time": "2:11:26"}
|
| 981 |
+
{"current_steps": 981, "total_steps": 1170, "loss": 0.1845, "lr": 3.0961982891241083e-06, "epoch": 4.187633262260128, "percentage": 83.85, "elapsed_time": "11:18:41", "remaining_time": "2:10:45"}
|
| 982 |
+
{"current_steps": 982, "total_steps": 1170, "loss": 0.1883, "lr": 3.0643823250654447e-06, "epoch": 4.1918976545842215, "percentage": 83.93, "elapsed_time": "11:19:26", "remaining_time": "2:10:04"}
|
| 983 |
+
{"current_steps": 983, "total_steps": 1170, "loss": 0.1804, "lr": 3.032717106286409e-06, "epoch": 4.196162046908316, "percentage": 84.02, "elapsed_time": "11:20:05", "remaining_time": "2:09:22"}
|
| 984 |
+
{"current_steps": 984, "total_steps": 1170, "loss": 0.1876, "lr": 3.001202914641628e-06, "epoch": 4.20042643923241, "percentage": 84.1, "elapsed_time": "11:20:48", "remaining_time": "2:08:41"}
|
| 985 |
+
{"current_steps": 985, "total_steps": 1170, "loss": 0.1847, "lr": 2.9698400306414353e-06, "epoch": 4.204690831556503, "percentage": 84.19, "elapsed_time": "11:21:33", "remaining_time": "2:08:00"}
|
| 986 |
+
{"current_steps": 986, "total_steps": 1170, "loss": 0.1674, "lr": 2.9386287334493426e-06, "epoch": 4.208955223880597, "percentage": 84.27, "elapsed_time": "11:22:14", "remaining_time": "2:07:18"}
|
| 987 |
+
{"current_steps": 987, "total_steps": 1170, "loss": 0.1815, "lr": 2.907569300879596e-06, "epoch": 4.21321961620469, "percentage": 84.36, "elapsed_time": "11:22:56", "remaining_time": "2:06:37"}
|
| 988 |
+
{"current_steps": 988, "total_steps": 1170, "loss": 0.1924, "lr": 2.876662009394673e-06, "epoch": 4.217484008528785, "percentage": 84.44, "elapsed_time": "11:23:35", "remaining_time": "2:05:55"}
|
| 989 |
+
{"current_steps": 989, "total_steps": 1170, "loss": 0.1912, "lr": 2.8459071341028323e-06, "epoch": 4.221748400852879, "percentage": 84.53, "elapsed_time": "11:24:15", "remaining_time": "2:05:13"}
|
| 990 |
+
{"current_steps": 990, "total_steps": 1170, "loss": 0.1779, "lr": 2.815304948755664e-06, "epoch": 4.226012793176972, "percentage": 84.62, "elapsed_time": "11:24:59", "remaining_time": "2:04:32"}
|
| 991 |
+
{"current_steps": 991, "total_steps": 1170, "loss": 0.1872, "lr": 2.784855725745661e-06, "epoch": 4.230277185501066, "percentage": 84.7, "elapsed_time": "11:25:39", "remaining_time": "2:03:50"}
|
| 992 |
+
{"current_steps": 992, "total_steps": 1170, "loss": 0.1934, "lr": 2.7545597361037657e-06, "epoch": 4.23454157782516, "percentage": 84.79, "elapsed_time": "11:26:26", "remaining_time": "2:03:10"}
|
| 993 |
+
{"current_steps": 993, "total_steps": 1170, "loss": 0.1935, "lr": 2.7244172494969978e-06, "epoch": 4.2388059701492535, "percentage": 84.87, "elapsed_time": "11:27:04", "remaining_time": "2:02:28"}
|
| 994 |
+
{"current_steps": 994, "total_steps": 1170, "loss": 0.1746, "lr": 2.6944285342260277e-06, "epoch": 4.243070362473348, "percentage": 84.96, "elapsed_time": "11:27:39", "remaining_time": "2:01:45"}
|
| 995 |
+
{"current_steps": 995, "total_steps": 1170, "loss": 0.1745, "lr": 2.6645938572227946e-06, "epoch": 4.247334754797441, "percentage": 85.04, "elapsed_time": "11:28:22", "remaining_time": "2:01:04"}
|
| 996 |
+
{"current_steps": 996, "total_steps": 1170, "loss": 0.1826, "lr": 2.6349134840481294e-06, "epoch": 4.251599147121535, "percentage": 85.13, "elapsed_time": "11:29:05", "remaining_time": "2:00:23"}
|
| 997 |
+
{"current_steps": 997, "total_steps": 1170, "loss": 0.1765, "lr": 2.6053876788893952e-06, "epoch": 4.255863539445629, "percentage": 85.21, "elapsed_time": "11:29:48", "remaining_time": "1:59:41"}
|
| 998 |
+
{"current_steps": 998, "total_steps": 1170, "loss": 0.1779, "lr": 2.5760167045581308e-06, "epoch": 4.2601279317697225, "percentage": 85.3, "elapsed_time": "11:30:29", "remaining_time": "1:59:00"}
|
| 999 |
+
{"current_steps": 999, "total_steps": 1170, "loss": 0.178, "lr": 2.546800822487714e-06, "epoch": 4.264392324093817, "percentage": 85.38, "elapsed_time": "11:31:13", "remaining_time": "1:58:19"}
|
| 1000 |
+
{"current_steps": 1000, "total_steps": 1170, "loss": 0.1685, "lr": 2.5177402927310344e-06, "epoch": 4.268656716417911, "percentage": 85.47, "elapsed_time": "11:31:57", "remaining_time": "1:57:38"}
|
| 1001 |
+
{"current_steps": 1001, "total_steps": 1170, "loss": 0.183, "lr": 2.488835373958185e-06, "epoch": 4.272921108742004, "percentage": 85.56, "elapsed_time": "11:32:32", "remaining_time": "1:56:55"}
|
| 1002 |
+
{"current_steps": 1002, "total_steps": 1170, "loss": 0.1788, "lr": 2.4600863234541338e-06, "epoch": 4.277185501066098, "percentage": 85.64, "elapsed_time": "11:33:13", "remaining_time": "1:56:13"}
|
| 1003 |
+
{"current_steps": 1003, "total_steps": 1170, "loss": 0.1838, "lr": 2.4314933971164734e-06, "epoch": 4.281449893390192, "percentage": 85.73, "elapsed_time": "11:33:57", "remaining_time": "1:55:32"}
|
| 1004 |
+
{"current_steps": 1004, "total_steps": 1170, "loss": 0.1744, "lr": 2.4030568494531135e-06, "epoch": 4.285714285714286, "percentage": 85.81, "elapsed_time": "11:34:39", "remaining_time": "1:54:51"}
|
| 1005 |
+
{"current_steps": 1005, "total_steps": 1170, "loss": 0.1912, "lr": 2.374776933580025e-06, "epoch": 4.28997867803838, "percentage": 85.9, "elapsed_time": "11:35:23", "remaining_time": "1:54:10"}
|
| 1006 |
+
{"current_steps": 1006, "total_steps": 1170, "loss": 0.1684, "lr": 2.3466539012189913e-06, "epoch": 4.294243070362473, "percentage": 85.98, "elapsed_time": "11:36:06", "remaining_time": "1:53:28"}
|
| 1007 |
+
{"current_steps": 1007, "total_steps": 1170, "loss": 0.184, "lr": 2.318688002695355e-06, "epoch": 4.298507462686567, "percentage": 86.07, "elapsed_time": "11:36:47", "remaining_time": "1:52:47"}
|
| 1008 |
+
{"current_steps": 1008, "total_steps": 1170, "loss": 0.1831, "lr": 2.2908794869358044e-06, "epoch": 4.302771855010661, "percentage": 86.15, "elapsed_time": "11:37:29", "remaining_time": "1:52:05"}
|
| 1009 |
+
{"current_steps": 1009, "total_steps": 1170, "loss": 0.1904, "lr": 2.2632286014661477e-06, "epoch": 4.3070362473347545, "percentage": 86.24, "elapsed_time": "11:38:14", "remaining_time": "1:51:24"}
|
| 1010 |
+
{"current_steps": 1010, "total_steps": 1170, "loss": 0.1588, "lr": 2.2357355924091207e-06, "epoch": 4.311300639658849, "percentage": 86.32, "elapsed_time": "11:38:49", "remaining_time": "1:50:42"}
|
| 1011 |
+
{"current_steps": 1011, "total_steps": 1170, "loss": 0.1805, "lr": 2.2084007044821764e-06, "epoch": 4.315565031982943, "percentage": 86.41, "elapsed_time": "11:39:25", "remaining_time": "1:49:59"}
|
| 1012 |
+
{"current_steps": 1012, "total_steps": 1170, "loss": 0.1896, "lr": 2.181224180995336e-06, "epoch": 4.319829424307036, "percentage": 86.5, "elapsed_time": "11:40:06", "remaining_time": "1:49:18"}
|
| 1013 |
+
{"current_steps": 1013, "total_steps": 1170, "loss": 0.1691, "lr": 2.154206263848986e-06, "epoch": 4.32409381663113, "percentage": 86.58, "elapsed_time": "11:40:44", "remaining_time": "1:48:36"}
|
| 1014 |
+
{"current_steps": 1014, "total_steps": 1170, "loss": 0.197, "lr": 2.127347193531757e-06, "epoch": 4.3283582089552235, "percentage": 86.67, "elapsed_time": "11:41:30", "remaining_time": "1:47:55"}
|
| 1015 |
+
{"current_steps": 1015, "total_steps": 1170, "loss": 0.1767, "lr": 2.1006472091183715e-06, "epoch": 4.332622601279318, "percentage": 86.75, "elapsed_time": "11:42:15", "remaining_time": "1:47:14"}
|
| 1016 |
+
{"current_steps": 1016, "total_steps": 1170, "loss": 0.1745, "lr": 2.074106548267516e-06, "epoch": 4.336886993603412, "percentage": 86.84, "elapsed_time": "11:42:59", "remaining_time": "1:46:33"}
|
| 1017 |
+
{"current_steps": 1017, "total_steps": 1170, "loss": 0.1743, "lr": 2.0477254472197237e-06, "epoch": 4.341151385927505, "percentage": 86.92, "elapsed_time": "11:43:38", "remaining_time": "1:45:51"}
|
| 1018 |
+
{"current_steps": 1018, "total_steps": 1170, "loss": 0.1734, "lr": 2.021504140795265e-06, "epoch": 4.345415778251599, "percentage": 87.01, "elapsed_time": "11:44:20", "remaining_time": "1:45:10"}
|
| 1019 |
+
{"current_steps": 1019, "total_steps": 1170, "loss": 0.1975, "lr": 1.995442862392081e-06, "epoch": 4.349680170575693, "percentage": 87.09, "elapsed_time": "11:45:04", "remaining_time": "1:44:28"}
|
| 1020 |
+
{"current_steps": 1020, "total_steps": 1170, "loss": 0.1745, "lr": 1.96954184398368e-06, "epoch": 4.353944562899787, "percentage": 87.18, "elapsed_time": "11:45:38", "remaining_time": "1:43:46"}
|
| 1021 |
+
{"current_steps": 1021, "total_steps": 1170, "loss": 0.1663, "lr": 1.943801316117089e-06, "epoch": 4.358208955223881, "percentage": 87.26, "elapsed_time": "11:46:20", "remaining_time": "1:43:04"}
|
| 1022 |
+
{"current_steps": 1022, "total_steps": 1170, "loss": 0.1756, "lr": 1.918221507910789e-06, "epoch": 4.362473347547974, "percentage": 87.35, "elapsed_time": "11:46:57", "remaining_time": "1:42:22"}
|
| 1023 |
+
{"current_steps": 1023, "total_steps": 1170, "loss": 0.1909, "lr": 1.8928026470526917e-06, "epoch": 4.366737739872068, "percentage": 87.44, "elapsed_time": "11:47:38", "remaining_time": "1:41:41"}
|
| 1024 |
+
{"current_steps": 1024, "total_steps": 1170, "loss": 0.1906, "lr": 1.8675449597980978e-06, "epoch": 4.371002132196162, "percentage": 87.52, "elapsed_time": "11:48:19", "remaining_time": "1:40:59"}
|
| 1025 |
+
{"current_steps": 1025, "total_steps": 1170, "loss": 0.166, "lr": 1.842448670967687e-06, "epoch": 4.3752665245202556, "percentage": 87.61, "elapsed_time": "11:49:06", "remaining_time": "1:40:18"}
|
| 1026 |
+
{"current_steps": 1026, "total_steps": 1170, "loss": 0.1694, "lr": 1.817514003945524e-06, "epoch": 4.37953091684435, "percentage": 87.69, "elapsed_time": "11:49:47", "remaining_time": "1:39:37"}
|
| 1027 |
+
{"current_steps": 1027, "total_steps": 1170, "loss": 0.2076, "lr": 1.792741180677069e-06, "epoch": 4.383795309168444, "percentage": 87.78, "elapsed_time": "11:50:29", "remaining_time": "1:38:55"}
|
| 1028 |
+
{"current_steps": 1028, "total_steps": 1170, "loss": 0.1793, "lr": 1.76813042166718e-06, "epoch": 4.388059701492537, "percentage": 87.86, "elapsed_time": "11:51:09", "remaining_time": "1:38:14"}
|
| 1029 |
+
{"current_steps": 1029, "total_steps": 1170, "loss": 0.1769, "lr": 1.743681945978184e-06, "epoch": 4.392324093816631, "percentage": 87.95, "elapsed_time": "11:51:48", "remaining_time": "1:37:32"}
|
| 1030 |
+
{"current_steps": 1030, "total_steps": 1170, "loss": 0.1768, "lr": 1.7193959712279106e-06, "epoch": 4.396588486140725, "percentage": 88.03, "elapsed_time": "11:52:30", "remaining_time": "1:36:50"}
|
| 1031 |
+
{"current_steps": 1031, "total_steps": 1170, "loss": 0.1813, "lr": 1.6952727135877501e-06, "epoch": 4.400852878464819, "percentage": 88.12, "elapsed_time": "11:53:13", "remaining_time": "1:36:09"}
|
| 1032 |
+
{"current_steps": 1032, "total_steps": 1170, "loss": 0.1729, "lr": 1.6713123877807413e-06, "epoch": 4.405117270788913, "percentage": 88.21, "elapsed_time": "11:53:50", "remaining_time": "1:35:27"}
|
| 1033 |
+
{"current_steps": 1033, "total_steps": 1170, "loss": 0.184, "lr": 1.6475152070796396e-06, "epoch": 4.409381663113006, "percentage": 88.29, "elapsed_time": "11:54:35", "remaining_time": "1:34:46"}
|
| 1034 |
+
{"current_steps": 1034, "total_steps": 1170, "loss": 0.1836, "lr": 1.6238813833050504e-06, "epoch": 4.4136460554371, "percentage": 88.38, "elapsed_time": "11:55:14", "remaining_time": "1:34:04"}
|
| 1035 |
+
{"current_steps": 1035, "total_steps": 1170, "loss": 0.2054, "lr": 1.6004111268235156e-06, "epoch": 4.417910447761194, "percentage": 88.46, "elapsed_time": "11:56:01", "remaining_time": "1:33:23"}
|
| 1036 |
+
{"current_steps": 1036, "total_steps": 1170, "loss": 0.1739, "lr": 1.5771046465456574e-06, "epoch": 4.422174840085288, "percentage": 88.55, "elapsed_time": "11:56:45", "remaining_time": "1:32:42"}
|
| 1037 |
+
{"current_steps": 1037, "total_steps": 1170, "loss": 0.182, "lr": 1.5539621499243064e-06, "epoch": 4.426439232409382, "percentage": 88.63, "elapsed_time": "11:57:21", "remaining_time": "1:32:00"}
|
| 1038 |
+
{"current_steps": 1038, "total_steps": 1170, "loss": 0.2013, "lr": 1.5309838429526714e-06, "epoch": 4.430703624733475, "percentage": 88.72, "elapsed_time": "11:58:02", "remaining_time": "1:31:18"}
|
| 1039 |
+
{"current_steps": 1039, "total_steps": 1170, "loss": 0.1771, "lr": 1.5081699301624819e-06, "epoch": 4.434968017057569, "percentage": 88.8, "elapsed_time": "11:58:45", "remaining_time": "1:30:37"}
|
| 1040 |
+
{"current_steps": 1040, "total_steps": 1170, "loss": 0.1826, "lr": 1.4855206146221934e-06, "epoch": 4.439232409381663, "percentage": 88.89, "elapsed_time": "11:59:26", "remaining_time": "1:29:55"}
|
| 1041 |
+
{"current_steps": 1041, "total_steps": 1170, "loss": 0.1748, "lr": 1.4630360979351644e-06, "epoch": 4.443496801705757, "percentage": 88.97, "elapsed_time": "12:00:10", "remaining_time": "1:29:14"}
|
| 1042 |
+
{"current_steps": 1042, "total_steps": 1170, "loss": 0.1891, "lr": 1.4407165802378664e-06, "epoch": 4.447761194029851, "percentage": 89.06, "elapsed_time": "12:00:53", "remaining_time": "1:28:33"}
|
| 1043 |
+
{"current_steps": 1043, "total_steps": 1170, "loss": 0.1844, "lr": 1.4185622601981042e-06, "epoch": 4.452025586353945, "percentage": 89.15, "elapsed_time": "12:01:34", "remaining_time": "1:27:51"}
|
| 1044 |
+
{"current_steps": 1044, "total_steps": 1170, "loss": 0.186, "lr": 1.396573335013236e-06, "epoch": 4.456289978678038, "percentage": 89.23, "elapsed_time": "12:02:13", "remaining_time": "1:27:09"}
|
| 1045 |
+
{"current_steps": 1045, "total_steps": 1170, "loss": 0.1894, "lr": 1.374750000408438e-06, "epoch": 4.460554371002132, "percentage": 89.32, "elapsed_time": "12:02:56", "remaining_time": "1:26:28"}
|
| 1046 |
+
{"current_steps": 1046, "total_steps": 1170, "loss": 0.1781, "lr": 1.353092450634943e-06, "epoch": 4.464818763326226, "percentage": 89.4, "elapsed_time": "12:03:38", "remaining_time": "1:25:47"}
|
| 1047 |
+
{"current_steps": 1047, "total_steps": 1170, "loss": 0.1955, "lr": 1.3316008784683265e-06, "epoch": 4.46908315565032, "percentage": 89.49, "elapsed_time": "12:04:18", "remaining_time": "1:25:05"}
|
| 1048 |
+
{"current_steps": 1048, "total_steps": 1170, "loss": 0.1787, "lr": 1.3102754752067792e-06, "epoch": 4.473347547974414, "percentage": 89.57, "elapsed_time": "12:05:03", "remaining_time": "1:24:24"}
|
| 1049 |
+
{"current_steps": 1049, "total_steps": 1170, "loss": 0.185, "lr": 1.2891164306694148e-06, "epoch": 4.477611940298507, "percentage": 89.66, "elapsed_time": "12:05:48", "remaining_time": "1:23:43"}
|
| 1050 |
+
{"current_steps": 1050, "total_steps": 1170, "loss": 0.1917, "lr": 1.2681239331945695e-06, "epoch": 4.481876332622601, "percentage": 89.74, "elapsed_time": "12:06:31", "remaining_time": "1:23:01"}
|
| 1051 |
+
{"current_steps": 1051, "total_steps": 1170, "loss": 0.1828, "lr": 1.2472981696381315e-06, "epoch": 4.486140724946695, "percentage": 89.83, "elapsed_time": "12:07:08", "remaining_time": "1:22:19"}
|
| 1052 |
+
{"current_steps": 1052, "total_steps": 1170, "loss": 0.1951, "lr": 1.2266393253718812e-06, "epoch": 4.490405117270789, "percentage": 89.91, "elapsed_time": "12:07:47", "remaining_time": "1:21:38"}
|
| 1053 |
+
{"current_steps": 1053, "total_steps": 1170, "loss": 0.1762, "lr": 1.2061475842818337e-06, "epoch": 4.494669509594883, "percentage": 90.0, "elapsed_time": "12:08:32", "remaining_time": "1:20:56"}
|
| 1054 |
+
{"current_steps": 1054, "total_steps": 1170, "loss": 0.1809, "lr": 1.185823128766601e-06, "epoch": 4.498933901918977, "percentage": 90.09, "elapsed_time": "12:09:12", "remaining_time": "1:20:15"}
|
| 1055 |
+
{"current_steps": 1055, "total_steps": 1170, "loss": 0.1674, "lr": 1.1656661397357815e-06, "epoch": 4.50319829424307, "percentage": 90.17, "elapsed_time": "12:09:52", "remaining_time": "1:19:33"}
|
| 1056 |
+
{"current_steps": 1056, "total_steps": 1170, "loss": 0.1723, "lr": 1.1456767966083393e-06, "epoch": 4.507462686567164, "percentage": 90.26, "elapsed_time": "12:10:33", "remaining_time": "1:18:52"}
|
| 1057 |
+
{"current_steps": 1057, "total_steps": 1170, "loss": 0.1729, "lr": 1.1258552773110031e-06, "epoch": 4.5117270788912585, "percentage": 90.34, "elapsed_time": "12:11:09", "remaining_time": "1:18:09"}
|
| 1058 |
+
{"current_steps": 1058, "total_steps": 1170, "loss": 0.1752, "lr": 1.106201758276697e-06, "epoch": 4.515991471215352, "percentage": 90.43, "elapsed_time": "12:11:50", "remaining_time": "1:17:28"}
|
| 1059 |
+
{"current_steps": 1059, "total_steps": 1170, "loss": 0.1796, "lr": 1.086716414442952e-06, "epoch": 4.520255863539446, "percentage": 90.51, "elapsed_time": "12:12:26", "remaining_time": "1:16:46"}
|
| 1060 |
+
{"current_steps": 1060, "total_steps": 1170, "loss": 0.169, "lr": 1.0673994192503633e-06, "epoch": 4.524520255863539, "percentage": 90.6, "elapsed_time": "12:13:05", "remaining_time": "1:16:04"}
|
| 1061 |
+
{"current_steps": 1061, "total_steps": 1170, "loss": 0.1826, "lr": 1.048250944641045e-06, "epoch": 4.528784648187633, "percentage": 90.68, "elapsed_time": "12:13:41", "remaining_time": "1:15:22"}
|
| 1062 |
+
{"current_steps": 1062, "total_steps": 1170, "loss": 0.1892, "lr": 1.0292711610570904e-06, "epoch": 4.533049040511727, "percentage": 90.77, "elapsed_time": "12:14:23", "remaining_time": "1:14:40"}
|
| 1063 |
+
{"current_steps": 1063, "total_steps": 1170, "loss": 0.1703, "lr": 1.0104602374390593e-06, "epoch": 4.537313432835821, "percentage": 90.85, "elapsed_time": "12:15:09", "remaining_time": "1:14:00"}
|
| 1064 |
+
{"current_steps": 1064, "total_steps": 1170, "loss": 0.1771, "lr": 9.918183412244863e-07, "epoch": 4.541577825159915, "percentage": 90.94, "elapsed_time": "12:15:54", "remaining_time": "1:13:18"}
|
| 1065 |
+
{"current_steps": 1065, "total_steps": 1170, "loss": 0.1809, "lr": 9.733456383463658e-07, "epoch": 4.545842217484008, "percentage": 91.03, "elapsed_time": "12:16:30", "remaining_time": "1:12:36"}
|
| 1066 |
+
{"current_steps": 1066, "total_steps": 1170, "loss": 0.1882, "lr": 9.550422932316938e-07, "epoch": 4.550106609808102, "percentage": 91.11, "elapsed_time": "12:17:12", "remaining_time": "1:11:55"}
|
| 1067 |
+
{"current_steps": 1067, "total_steps": 1170, "loss": 0.2033, "lr": 9.369084688000063e-07, "epoch": 4.554371002132196, "percentage": 91.2, "elapsed_time": "12:17:57", "remaining_time": "1:11:14"}
|
| 1068 |
+
{"current_steps": 1068, "total_steps": 1170, "loss": 0.1724, "lr": 9.189443264619102e-07, "epoch": 4.55863539445629, "percentage": 91.28, "elapsed_time": "12:18:37", "remaining_time": "1:10:32"}
|
| 1069 |
+
{"current_steps": 1069, "total_steps": 1170, "loss": 0.1894, "lr": 9.011500261176742e-07, "epoch": 4.562899786780384, "percentage": 91.37, "elapsed_time": "12:19:23", "remaining_time": "1:09:51"}
|
| 1070 |
+
{"current_steps": 1070, "total_steps": 1170, "loss": 0.1835, "lr": 8.835257261557695e-07, "epoch": 4.567164179104478, "percentage": 91.45, "elapsed_time": "12:20:05", "remaining_time": "1:09:10"}
|
| 1071 |
+
{"current_steps": 1071, "total_steps": 1170, "loss": 0.1734, "lr": 8.660715834514977e-07, "epoch": 4.571428571428571, "percentage": 91.54, "elapsed_time": "12:20:45", "remaining_time": "1:08:28"}
|
| 1072 |
+
{"current_steps": 1072, "total_steps": 1170, "loss": 0.1796, "lr": 8.487877533655698e-07, "epoch": 4.575692963752665, "percentage": 91.62, "elapsed_time": "12:21:27", "remaining_time": "1:07:46"}
|
| 1073 |
+
{"current_steps": 1073, "total_steps": 1170, "loss": 0.1705, "lr": 8.316743897427315e-07, "epoch": 4.5799573560767595, "percentage": 91.71, "elapsed_time": "12:22:06", "remaining_time": "1:07:05"}
|
| 1074 |
+
{"current_steps": 1074, "total_steps": 1170, "loss": 0.1795, "lr": 8.147316449103959e-07, "epoch": 4.584221748400853, "percentage": 91.79, "elapsed_time": "12:22:47", "remaining_time": "1:06:23"}
|
| 1075 |
+
{"current_steps": 1075, "total_steps": 1170, "loss": 0.1888, "lr": 7.979596696772773e-07, "epoch": 4.588486140724947, "percentage": 91.88, "elapsed_time": "12:23:26", "remaining_time": "1:05:41"}
|
| 1076 |
+
{"current_steps": 1076, "total_steps": 1170, "loss": 0.193, "lr": 7.813586133320661e-07, "epoch": 4.59275053304904, "percentage": 91.97, "elapsed_time": "12:24:09", "remaining_time": "1:05:00"}
|
| 1077 |
+
{"current_steps": 1077, "total_steps": 1170, "loss": 0.1924, "lr": 7.649286236420806e-07, "epoch": 4.597014925373134, "percentage": 92.05, "elapsed_time": "12:24:51", "remaining_time": "1:04:19"}
|
| 1078 |
+
{"current_steps": 1078, "total_steps": 1170, "loss": 0.184, "lr": 7.486698468519682e-07, "epoch": 4.601279317697228, "percentage": 92.14, "elapsed_time": "12:25:34", "remaining_time": "1:03:37"}
|
| 1079 |
+
{"current_steps": 1079, "total_steps": 1170, "loss": 0.175, "lr": 7.325824276823934e-07, "epoch": 4.605543710021322, "percentage": 92.22, "elapsed_time": "12:26:16", "remaining_time": "1:02:56"}
|
| 1080 |
+
{"current_steps": 1080, "total_steps": 1170, "loss": 0.1747, "lr": 7.166665093287539e-07, "epoch": 4.609808102345416, "percentage": 92.31, "elapsed_time": "12:26:57", "remaining_time": "1:02:14"}
|
| 1081 |
+
{"current_steps": 1081, "total_steps": 1170, "loss": 0.1788, "lr": 7.009222334599019e-07, "epoch": 4.61407249466951, "percentage": 92.39, "elapsed_time": "12:27:42", "remaining_time": "1:01:33"}
|
| 1082 |
+
{"current_steps": 1082, "total_steps": 1170, "loss": 0.1799, "lr": 6.853497402168896e-07, "epoch": 4.618336886993603, "percentage": 92.48, "elapsed_time": "12:28:23", "remaining_time": "1:00:52"}
|
| 1083 |
+
{"current_steps": 1083, "total_steps": 1170, "loss": 0.1917, "lr": 6.69949168211721e-07, "epoch": 4.622601279317697, "percentage": 92.56, "elapsed_time": "12:29:02", "remaining_time": "1:00:10"}
|
| 1084 |
+
{"current_steps": 1084, "total_steps": 1170, "loss": 0.1886, "lr": 6.547206545261109e-07, "epoch": 4.6268656716417915, "percentage": 92.65, "elapsed_time": "12:29:42", "remaining_time": "0:59:28"}
|
| 1085 |
+
{"current_steps": 1085, "total_steps": 1170, "loss": 0.1834, "lr": 6.396643347102683e-07, "epoch": 4.631130063965885, "percentage": 92.74, "elapsed_time": "12:30:26", "remaining_time": "0:58:47"}
|
| 1086 |
+
{"current_steps": 1086, "total_steps": 1170, "loss": 0.1809, "lr": 6.247803427816945e-07, "epoch": 4.635394456289979, "percentage": 92.82, "elapsed_time": "12:31:05", "remaining_time": "0:58:05"}
|
| 1087 |
+
{"current_steps": 1087, "total_steps": 1170, "loss": 0.1807, "lr": 6.10068811223985e-07, "epoch": 4.639658848614072, "percentage": 92.91, "elapsed_time": "12:31:48", "remaining_time": "0:57:24"}
|
| 1088 |
+
{"current_steps": 1088, "total_steps": 1170, "loss": 0.1844, "lr": 5.955298709856516e-07, "epoch": 4.643923240938166, "percentage": 92.99, "elapsed_time": "12:32:31", "remaining_time": "0:56:42"}
|
| 1089 |
+
{"current_steps": 1089, "total_steps": 1170, "loss": 0.1772, "lr": 5.811636514789598e-07, "epoch": 4.6481876332622605, "percentage": 93.08, "elapsed_time": "12:33:11", "remaining_time": "0:56:01"}
|
| 1090 |
+
{"current_steps": 1090, "total_steps": 1170, "loss": 0.1989, "lr": 5.669702805787714e-07, "epoch": 4.652452025586354, "percentage": 93.16, "elapsed_time": "12:33:49", "remaining_time": "0:55:19"}
|
| 1091 |
+
{"current_steps": 1091, "total_steps": 1170, "loss": 0.1863, "lr": 5.529498846214054e-07, "epoch": 4.656716417910448, "percentage": 93.25, "elapsed_time": "12:34:30", "remaining_time": "0:54:38"}
|
| 1092 |
+
{"current_steps": 1092, "total_steps": 1170, "loss": 0.1677, "lr": 5.391025884035239e-07, "epoch": 4.660980810234541, "percentage": 93.33, "elapsed_time": "12:35:13", "remaining_time": "0:53:56"}
|
| 1093 |
+
{"current_steps": 1093, "total_steps": 1170, "loss": 0.1751, "lr": 5.254285151810124e-07, "epoch": 4.665245202558635, "percentage": 93.42, "elapsed_time": "12:35:54", "remaining_time": "0:53:15"}
|
| 1094 |
+
{"current_steps": 1094, "total_steps": 1170, "loss": 0.1935, "lr": 5.119277866678829e-07, "epoch": 4.669509594882729, "percentage": 93.5, "elapsed_time": "12:36:35", "remaining_time": "0:52:33"}
|
| 1095 |
+
{"current_steps": 1095, "total_steps": 1170, "loss": 0.184, "lr": 4.986005230351954e-07, "epoch": 4.673773987206823, "percentage": 93.59, "elapsed_time": "12:37:19", "remaining_time": "0:51:52"}
|
| 1096 |
+
{"current_steps": 1096, "total_steps": 1170, "loss": 0.1735, "lr": 4.854468429099801e-07, "epoch": 4.678038379530917, "percentage": 93.68, "elapsed_time": "12:38:03", "remaining_time": "0:51:10"}
|
| 1097 |
+
{"current_steps": 1097, "total_steps": 1170, "loss": 0.1765, "lr": 4.7246686337419247e-07, "epoch": 4.682302771855011, "percentage": 93.76, "elapsed_time": "12:38:45", "remaining_time": "0:50:29"}
|
| 1098 |
+
{"current_steps": 1098, "total_steps": 1170, "loss": 0.2019, "lr": 4.5966069996365993e-07, "epoch": 4.686567164179104, "percentage": 93.85, "elapsed_time": "12:39:27", "remaining_time": "0:49:48"}
|
| 1099 |
+
{"current_steps": 1099, "total_steps": 1170, "loss": 0.1736, "lr": 4.470284666670632e-07, "epoch": 4.690831556503198, "percentage": 93.93, "elapsed_time": "12:40:08", "remaining_time": "0:49:06"}
|
| 1100 |
+
{"current_steps": 1100, "total_steps": 1170, "loss": 0.1636, "lr": 4.345702759249171e-07, "epoch": 4.6950959488272925, "percentage": 94.02, "elapsed_time": "12:40:47", "remaining_time": "0:48:24"}
|
| 1101 |
+
{"current_steps": 1101, "total_steps": 1170, "loss": 0.1911, "lr": 4.22286238628562e-07, "epoch": 4.699360341151386, "percentage": 94.1, "elapsed_time": "12:41:33", "remaining_time": "0:47:43"}
|
| 1102 |
+
{"current_steps": 1102, "total_steps": 1170, "loss": 0.1851, "lr": 4.101764641191963e-07, "epoch": 4.70362473347548, "percentage": 94.19, "elapsed_time": "12:42:16", "remaining_time": "0:47:02"}
|
| 1103 |
+
{"current_steps": 1103, "total_steps": 1170, "loss": 0.1791, "lr": 3.982410601868858e-07, "epoch": 4.707889125799573, "percentage": 94.27, "elapsed_time": "12:42:53", "remaining_time": "0:46:20"}
|
| 1104 |
+
{"current_steps": 1104, "total_steps": 1170, "loss": 0.1772, "lr": 3.8648013306960664e-07, "epoch": 4.712153518123667, "percentage": 94.36, "elapsed_time": "12:43:34", "remaining_time": "0:45:38"}
|
| 1105 |
+
{"current_steps": 1105, "total_steps": 1170, "loss": 0.1687, "lr": 3.748937874523062e-07, "epoch": 4.7164179104477615, "percentage": 94.44, "elapsed_time": "12:44:11", "remaining_time": "0:44:57"}
|
| 1106 |
+
{"current_steps": 1106, "total_steps": 1170, "loss": 0.168, "lr": 3.634821264659727e-07, "epoch": 4.720682302771855, "percentage": 94.53, "elapsed_time": "12:44:55", "remaining_time": "0:44:15"}
|
| 1107 |
+
{"current_steps": 1107, "total_steps": 1170, "loss": 0.1805, "lr": 3.522452516867048e-07, "epoch": 4.724946695095949, "percentage": 94.62, "elapsed_time": "12:45:35", "remaining_time": "0:43:34"}
|
| 1108 |
+
{"current_steps": 1108, "total_steps": 1170, "loss": 0.1812, "lr": 3.4118326313481887e-07, "epoch": 4.729211087420042, "percentage": 94.7, "elapsed_time": "12:46:18", "remaining_time": "0:42:52"}
|
| 1109 |
+
{"current_steps": 1109, "total_steps": 1170, "loss": 0.1812, "lr": 3.3029625927395446e-07, "epoch": 4.733475479744136, "percentage": 94.79, "elapsed_time": "12:46:59", "remaining_time": "0:42:11"}
|
| 1110 |
+
{"current_steps": 1110, "total_steps": 1170, "loss": 0.1882, "lr": 3.1958433701019697e-07, "epoch": 4.73773987206823, "percentage": 94.87, "elapsed_time": "12:47:42", "remaining_time": "0:41:29"}
|
| 1111 |
+
{"current_steps": 1111, "total_steps": 1170, "loss": 0.1605, "lr": 3.09047591691225e-07, "epoch": 4.742004264392325, "percentage": 94.96, "elapsed_time": "12:48:22", "remaining_time": "0:40:48"}
|
| 1112 |
+
{"current_steps": 1112, "total_steps": 1170, "loss": 0.1673, "lr": 2.9868611710543785e-07, "epoch": 4.746268656716418, "percentage": 95.04, "elapsed_time": "12:49:01", "remaining_time": "0:40:06"}
|
| 1113 |
+
{"current_steps": 1113, "total_steps": 1170, "loss": 0.1841, "lr": 2.8850000548115155e-07, "epoch": 4.750533049040512, "percentage": 95.13, "elapsed_time": "12:49:46", "remaining_time": "0:39:25"}
|
| 1114 |
+
{"current_steps": 1114, "total_steps": 1170, "loss": 0.2004, "lr": 2.7848934748574863e-07, "epoch": 4.754797441364605, "percentage": 95.21, "elapsed_time": "12:50:33", "remaining_time": "0:38:44"}
|
| 1115 |
+
{"current_steps": 1115, "total_steps": 1170, "loss": 0.1912, "lr": 2.686542322248986e-07, "epoch": 4.759061833688699, "percentage": 95.3, "elapsed_time": "12:51:14", "remaining_time": "0:38:02"}
|
| 1116 |
+
{"current_steps": 1116, "total_steps": 1170, "loss": 0.1726, "lr": 2.5899474724174313e-07, "epoch": 4.7633262260127935, "percentage": 95.38, "elapsed_time": "12:51:57", "remaining_time": "0:37:21"}
|
| 1117 |
+
{"current_steps": 1117, "total_steps": 1170, "loss": 0.1842, "lr": 2.495109785161232e-07, "epoch": 4.767590618336887, "percentage": 95.47, "elapsed_time": "12:52:34", "remaining_time": "0:36:39"}
|
| 1118 |
+
{"current_steps": 1118, "total_steps": 1170, "loss": 0.1869, "lr": 2.402030104638198e-07, "epoch": 4.771855010660981, "percentage": 95.56, "elapsed_time": "12:53:18", "remaining_time": "0:35:58"}
|
| 1119 |
+
{"current_steps": 1119, "total_steps": 1170, "loss": 0.1925, "lr": 2.3107092593579905e-07, "epoch": 4.776119402985074, "percentage": 95.64, "elapsed_time": "12:54:03", "remaining_time": "0:35:16"}
|
| 1120 |
+
{"current_steps": 1120, "total_steps": 1170, "loss": 0.1822, "lr": 2.2211480621746828e-07, "epoch": 4.780383795309168, "percentage": 95.73, "elapsed_time": "12:54:45", "remaining_time": "0:34:35"}
|
| 1121 |
+
{"current_steps": 1121, "total_steps": 1170, "loss": 0.1845, "lr": 2.133347310279632e-07, "epoch": 4.7846481876332625, "percentage": 95.81, "elapsed_time": "12:55:27", "remaining_time": "0:33:53"}
|
| 1122 |
+
{"current_steps": 1122, "total_steps": 1170, "loss": 0.1832, "lr": 2.0473077851942858e-07, "epoch": 4.788912579957356, "percentage": 95.9, "elapsed_time": "12:56:02", "remaining_time": "0:33:11"}
|
| 1123 |
+
{"current_steps": 1123, "total_steps": 1170, "loss": 0.19, "lr": 1.9630302527633427e-07, "epoch": 4.79317697228145, "percentage": 95.98, "elapsed_time": "12:56:45", "remaining_time": "0:32:30"}
|
| 1124 |
+
{"current_steps": 1124, "total_steps": 1170, "loss": 0.1985, "lr": 1.8805154631477808e-07, "epoch": 4.797441364605544, "percentage": 96.07, "elapsed_time": "12:57:28", "remaining_time": "0:31:49"}
|
| 1125 |
+
{"current_steps": 1125, "total_steps": 1170, "loss": 0.1889, "lr": 1.799764150818306e-07, "epoch": 4.801705756929637, "percentage": 96.15, "elapsed_time": "12:58:13", "remaining_time": "0:31:07"}
|
| 1126 |
+
{"current_steps": 1126, "total_steps": 1170, "loss": 0.2025, "lr": 1.7207770345488263e-07, "epoch": 4.8059701492537314, "percentage": 96.24, "elapsed_time": "12:58:57", "remaining_time": "0:30:26"}
|
| 1127 |
+
{"current_steps": 1127, "total_steps": 1170, "loss": 0.1651, "lr": 1.6435548174098536e-07, "epoch": 4.810234541577826, "percentage": 96.32, "elapsed_time": "12:59:37", "remaining_time": "0:29:44"}
|
| 1128 |
+
{"current_steps": 1128, "total_steps": 1170, "loss": 0.1999, "lr": 1.5680981867625566e-07, "epoch": 4.814498933901919, "percentage": 96.41, "elapsed_time": "13:00:20", "remaining_time": "0:29:03"}
|
| 1129 |
+
{"current_steps": 1129, "total_steps": 1170, "loss": 0.1882, "lr": 1.4944078142523854e-07, "epoch": 4.818763326226013, "percentage": 96.5, "elapsed_time": "13:01:03", "remaining_time": "0:28:21"}
|
| 1130 |
+
{"current_steps": 1130, "total_steps": 1170, "loss": 0.1663, "lr": 1.4224843558031888e-07, "epoch": 4.823027718550106, "percentage": 96.58, "elapsed_time": "13:01:43", "remaining_time": "0:27:40"}
|
| 1131 |
+
{"current_steps": 1131, "total_steps": 1170, "loss": 0.1822, "lr": 1.3523284516113955e-07, "epoch": 4.8272921108742, "percentage": 96.67, "elapsed_time": "13:02:23", "remaining_time": "0:26:58"}
|
| 1132 |
+
{"current_steps": 1132, "total_steps": 1170, "loss": 0.1883, "lr": 1.2839407261403091e-07, "epoch": 4.8315565031982945, "percentage": 96.75, "elapsed_time": "13:03:08", "remaining_time": "0:26:17"}
|
| 1133 |
+
{"current_steps": 1133, "total_steps": 1170, "loss": 0.1968, "lr": 1.2173217881144894e-07, "epoch": 4.835820895522388, "percentage": 96.84, "elapsed_time": "13:03:47", "remaining_time": "0:25:35"}
|
| 1134 |
+
{"current_steps": 1134, "total_steps": 1170, "loss": 0.1906, "lr": 1.1524722305144231e-07, "epoch": 4.840085287846482, "percentage": 96.92, "elapsed_time": "13:04:31", "remaining_time": "0:24:54"}
|
| 1135 |
+
{"current_steps": 1135, "total_steps": 1170, "loss": 0.1822, "lr": 1.0893926305711289e-07, "epoch": 4.844349680170575, "percentage": 97.01, "elapsed_time": "13:05:11", "remaining_time": "0:24:12"}
|
| 1136 |
+
{"current_steps": 1136, "total_steps": 1170, "loss": 0.1701, "lr": 1.0280835497612052e-07, "epoch": 4.848614072494669, "percentage": 97.09, "elapsed_time": "13:05:49", "remaining_time": "0:23:31"}
|
| 1137 |
+
{"current_steps": 1137, "total_steps": 1170, "loss": 0.1945, "lr": 9.685455338016347e-08, "epoch": 4.8528784648187635, "percentage": 97.18, "elapsed_time": "13:06:34", "remaining_time": "0:22:49"}
|
| 1138 |
+
{"current_steps": 1138, "total_steps": 1170, "loss": 0.1802, "lr": 9.107791126450106e-08, "epoch": 4.857142857142857, "percentage": 97.26, "elapsed_time": "13:07:18", "remaining_time": "0:22:08"}
|
| 1139 |
+
{"current_steps": 1139, "total_steps": 1170, "loss": 0.1687, "lr": 8.547848004748505e-08, "epoch": 4.861407249466951, "percentage": 97.35, "elapsed_time": "13:07:55", "remaining_time": "0:21:26"}
|
| 1140 |
+
{"current_steps": 1140, "total_steps": 1170, "loss": 0.1779, "lr": 8.005630957010014e-08, "epoch": 4.865671641791045, "percentage": 97.44, "elapsed_time": "13:08:38", "remaining_time": "0:20:45"}
|
| 1141 |
+
{"current_steps": 1141, "total_steps": 1170, "loss": 0.1659, "lr": 7.481144809551311e-08, "epoch": 4.869936034115138, "percentage": 97.52, "elapsed_time": "13:09:19", "remaining_time": "0:20:03"}
|
| 1142 |
+
{"current_steps": 1142, "total_steps": 1170, "loss": 0.1673, "lr": 6.974394230865766e-08, "epoch": 4.8742004264392325, "percentage": 97.61, "elapsed_time": "13:09:57", "remaining_time": "0:19:22"}
|
| 1143 |
+
{"current_steps": 1143, "total_steps": 1170, "loss": 0.1815, "lr": 6.485383731580142e-08, "epoch": 4.878464818763327, "percentage": 97.69, "elapsed_time": "13:10:43", "remaining_time": "0:18:40"}
|
| 1144 |
+
{"current_steps": 1144, "total_steps": 1170, "loss": 0.1667, "lr": 6.014117664415953e-08, "epoch": 4.88272921108742, "percentage": 97.78, "elapsed_time": "13:11:21", "remaining_time": "0:17:59"}
|
| 1145 |
+
{"current_steps": 1145, "total_steps": 1170, "loss": 0.1848, "lr": 5.560600224149948e-08, "epoch": 4.886993603411514, "percentage": 97.86, "elapsed_time": "13:12:09", "remaining_time": "0:17:17"}
|
| 1146 |
+
{"current_steps": 1146, "total_steps": 1170, "loss": 0.1977, "lr": 5.1248354475768034e-08, "epoch": 4.891257995735607, "percentage": 97.95, "elapsed_time": "13:12:52", "remaining_time": "0:16:36"}
|
| 1147 |
+
{"current_steps": 1147, "total_steps": 1170, "loss": 0.197, "lr": 4.706827213473819e-08, "epoch": 4.895522388059701, "percentage": 98.03, "elapsed_time": "13:13:32", "remaining_time": "0:15:54"}
|
| 1148 |
+
{"current_steps": 1148, "total_steps": 1170, "loss": 0.1752, "lr": 4.3065792425651675e-08, "epoch": 4.899786780383796, "percentage": 98.12, "elapsed_time": "13:14:08", "remaining_time": "0:15:13"}
|
| 1149 |
+
{"current_steps": 1149, "total_steps": 1170, "loss": 0.1769, "lr": 3.924095097489922e-08, "epoch": 4.904051172707889, "percentage": 98.21, "elapsed_time": "13:14:54", "remaining_time": "0:14:31"}
|
| 1150 |
+
{"current_steps": 1150, "total_steps": 1170, "loss": 0.1857, "lr": 3.559378182770079e-08, "epoch": 4.908315565031983, "percentage": 98.29, "elapsed_time": "13:15:41", "remaining_time": "0:13:50"}
|
| 1151 |
+
{"current_steps": 1151, "total_steps": 1170, "loss": 0.1762, "lr": 3.212431744779476e-08, "epoch": 4.912579957356077, "percentage": 98.38, "elapsed_time": "13:16:20", "remaining_time": "0:13:08"}
|
| 1152 |
+
{"current_steps": 1152, "total_steps": 1170, "loss": 0.1852, "lr": 2.8832588717164766e-08, "epoch": 4.91684434968017, "percentage": 98.46, "elapsed_time": "13:17:04", "remaining_time": "0:12:27"}
|
| 1153 |
+
{"current_steps": 1153, "total_steps": 1170, "loss": 0.1806, "lr": 2.5718624935744395e-08, "epoch": 4.9211087420042645, "percentage": 98.55, "elapsed_time": "13:17:41", "remaining_time": "0:11:45"}
|
| 1154 |
+
{"current_steps": 1154, "total_steps": 1170, "loss": 0.1905, "lr": 2.2782453821177386e-08, "epoch": 4.925373134328359, "percentage": 98.63, "elapsed_time": "13:18:18", "remaining_time": "0:11:04"}
|
| 1155 |
+
{"current_steps": 1155, "total_steps": 1170, "loss": 0.1682, "lr": 2.0024101508555604e-08, "epoch": 4.929637526652452, "percentage": 98.72, "elapsed_time": "13:18:57", "remaining_time": "0:10:22"}
|
| 1156 |
+
{"current_steps": 1156, "total_steps": 1170, "loss": 0.1802, "lr": 1.7443592550190346e-08, "epoch": 4.933901918976546, "percentage": 98.8, "elapsed_time": "13:19:36", "remaining_time": "0:09:41"}
|
| 1157 |
+
{"current_steps": 1157, "total_steps": 1170, "loss": 0.1896, "lr": 1.5040949915399173e-08, "epoch": 4.938166311300639, "percentage": 98.89, "elapsed_time": "13:20:19", "remaining_time": "0:08:59"}
|
| 1158 |
+
{"current_steps": 1158, "total_steps": 1170, "loss": 0.1926, "lr": 1.281619499029274e-08, "epoch": 4.9424307036247335, "percentage": 98.97, "elapsed_time": "13:21:03", "remaining_time": "0:08:18"}
|
| 1159 |
+
{"current_steps": 1159, "total_steps": 1170, "loss": 0.1852, "lr": 1.0769347577594958e-08, "epoch": 4.946695095948828, "percentage": 99.06, "elapsed_time": "13:21:49", "remaining_time": "0:07:36"}
|
| 1160 |
+
{"current_steps": 1160, "total_steps": 1170, "loss": 0.1724, "lr": 8.900425896454234e-09, "epoch": 4.950959488272921, "percentage": 99.15, "elapsed_time": "13:22:26", "remaining_time": "0:06:55"}
|
| 1161 |
+
{"current_steps": 1161, "total_steps": 1170, "loss": 0.1983, "lr": 7.209446582292501e-09, "epoch": 4.955223880597015, "percentage": 99.23, "elapsed_time": "13:23:01", "remaining_time": "0:06:13"}
|
| 1162 |
+
{"current_steps": 1162, "total_steps": 1170, "loss": 0.1728, "lr": 5.6964246866497705e-09, "epoch": 4.959488272921108, "percentage": 99.32, "elapsed_time": "13:23:40", "remaining_time": "0:05:31"}
|
| 1163 |
+
{"current_steps": 1163, "total_steps": 1170, "loss": 0.1821, "lr": 4.361373677055358e-09, "epoch": 4.963752665245202, "percentage": 99.4, "elapsed_time": "13:24:18", "remaining_time": "0:04:50"}
|
| 1164 |
+
{"current_steps": 1164, "total_steps": 1170, "loss": 0.1897, "lr": 3.2043054369057523e-09, "epoch": 4.968017057569297, "percentage": 99.49, "elapsed_time": "13:25:02", "remaining_time": "0:04:08"}
|
| 1165 |
+
{"current_steps": 1165, "total_steps": 1170, "loss": 0.186, "lr": 2.2252302653558155e-09, "epoch": 4.97228144989339, "percentage": 99.57, "elapsed_time": "13:25:43", "remaining_time": "0:03:27"}
|
| 1166 |
+
{"current_steps": 1166, "total_steps": 1170, "loss": 0.1861, "lr": 1.4241568772321856e-09, "epoch": 4.976545842217484, "percentage": 99.66, "elapsed_time": "13:26:23", "remaining_time": "0:02:45"}
|
| 1167 |
+
{"current_steps": 1167, "total_steps": 1170, "loss": 0.1736, "lr": 8.010924029533406e-10, "epoch": 4.980810234541578, "percentage": 99.74, "elapsed_time": "13:26:59", "remaining_time": "0:02:04"}
|
| 1168 |
+
{"current_steps": 1168, "total_steps": 1170, "loss": 0.1725, "lr": 3.560423884629849e-10, "epoch": 4.985074626865671, "percentage": 99.83, "elapsed_time": "13:27:38", "remaining_time": "0:01:22"}
|
| 1169 |
+
{"current_steps": 1169, "total_steps": 1170, "loss": 0.1762, "lr": 8.901079518786048e-11, "epoch": 4.9893390191897655, "percentage": 99.91, "elapsed_time": "13:28:20", "remaining_time": "0:00:41"}
|
| 1170 |
+
{"current_steps": 1170, "total_steps": 1170, "loss": 0.1743, "lr": 0.0, "epoch": 4.99360341151386, "percentage": 100.0, "elapsed_time": "13:28:54", "remaining_time": "0:00:00"}
|
| 1171 |
+
{"current_steps": 1170, "total_steps": 1170, "epoch": 4.99360341151386, "percentage": 100.0, "elapsed_time": "13:30:25", "remaining_time": "0:00:00"}
|