Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5530940438d0305c4152fbf1f4cc2489aa44f5697b4db134d4200155410ec8d9
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc81b2ac672ce52f29f38d321e8af2021ac911bf3c662edf149e1a6d97ae2840
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9d6827660fcbaec1a7148d2f028754c0f2e720adf7af932eed642acb23617999
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d5c2f9a89e38f1603006efd5756af2d9543cd5f257db1e9268cb798461256e2a
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -110,3 +110,114 @@
|
|
| 110 |
{"current_steps": 110, "total_steps": 333, "loss": 0.4766, "lr": 6.791036400297142e-05, "epoch": 0.9887640449438202, "percentage": 33.03, "elapsed_time": "2:58:38", "remaining_time": "6:02:08"}
|
| 111 |
{"current_steps": 111, "total_steps": 333, "loss": 0.4796, "lr": 6.760776875960347e-05, "epoch": 0.9977528089887641, "percentage": 33.33, "elapsed_time": "3:00:14", "remaining_time": "6:00:29"}
|
| 112 |
{"current_steps": 112, "total_steps": 333, "loss": 0.8205, "lr": 6.730212572874618e-05, "epoch": 1.006741573033708, "percentage": 33.63, "elapsed_time": "3:03:21", "remaining_time": "6:01:47"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 110 |
{"current_steps": 110, "total_steps": 333, "loss": 0.4766, "lr": 6.791036400297142e-05, "epoch": 0.9887640449438202, "percentage": 33.03, "elapsed_time": "2:58:38", "remaining_time": "6:02:08"}
|
| 111 |
{"current_steps": 111, "total_steps": 333, "loss": 0.4796, "lr": 6.760776875960347e-05, "epoch": 0.9977528089887641, "percentage": 33.33, "elapsed_time": "3:00:14", "remaining_time": "6:00:29"}
|
| 112 |
{"current_steps": 112, "total_steps": 333, "loss": 0.8205, "lr": 6.730212572874618e-05, "epoch": 1.006741573033708, "percentage": 33.63, "elapsed_time": "3:03:21", "remaining_time": "6:01:47"}
|
| 113 |
+
{"current_steps": 113, "total_steps": 333, "loss": 0.4547, "lr": 6.699346865217031e-05, "epoch": 1.0157303370786517, "percentage": 33.93, "elapsed_time": "3:04:57", "remaining_time": "6:00:06"}
|
| 114 |
+
{"current_steps": 114, "total_steps": 333, "loss": 0.4598, "lr": 6.668183160438531e-05, "epoch": 1.0247191011235954, "percentage": 34.23, "elapsed_time": "3:06:34", "remaining_time": "5:58:26"}
|
| 115 |
+
{"current_steps": 115, "total_steps": 333, "loss": 0.4566, "lr": 6.636724898887751e-05, "epoch": 1.0337078651685394, "percentage": 34.53, "elapsed_time": "3:08:12", "remaining_time": "5:56:46"}
|
| 116 |
+
{"current_steps": 116, "total_steps": 333, "loss": 0.4636, "lr": 6.604975553431219e-05, "epoch": 1.0426966292134832, "percentage": 34.83, "elapsed_time": "3:09:49", "remaining_time": "5:55:05"}
|
| 117 |
+
{"current_steps": 117, "total_steps": 333, "loss": 0.4539, "lr": 6.572938629069959e-05, "epoch": 1.051685393258427, "percentage": 35.14, "elapsed_time": "3:11:26", "remaining_time": "5:53:25"}
|
| 118 |
+
{"current_steps": 118, "total_steps": 333, "loss": 0.4626, "lr": 6.540617662552565e-05, "epoch": 1.060674157303371, "percentage": 35.44, "elapsed_time": "3:13:03", "remaining_time": "5:51:46"}
|
| 119 |
+
{"current_steps": 119, "total_steps": 333, "loss": 0.4507, "lr": 6.508016221984747e-05, "epoch": 1.0696629213483146, "percentage": 35.74, "elapsed_time": "3:14:40", "remaining_time": "5:50:06"}
|
| 120 |
+
{"current_steps": 120, "total_steps": 333, "loss": 0.4613, "lr": 6.475137906435435e-05, "epoch": 1.0786516853932584, "percentage": 36.04, "elapsed_time": "3:16:17", "remaining_time": "5:48:25"}
|
| 121 |
+
{"current_steps": 121, "total_steps": 333, "loss": 0.4656, "lr": 6.441986345539446e-05, "epoch": 1.0876404494382022, "percentage": 36.34, "elapsed_time": "3:17:54", "remaining_time": "5:46:45"}
|
| 122 |
+
{"current_steps": 122, "total_steps": 333, "loss": 0.4529, "lr": 6.408565199096798e-05, "epoch": 1.0966292134831461, "percentage": 36.64, "elapsed_time": "3:19:31", "remaining_time": "5:45:05"}
|
| 123 |
+
{"current_steps": 123, "total_steps": 333, "loss": 0.4588, "lr": 6.374878156668676e-05, "epoch": 1.1056179775280899, "percentage": 36.94, "elapsed_time": "3:21:09", "remaining_time": "5:43:27"}
|
| 124 |
+
{"current_steps": 124, "total_steps": 333, "loss": 0.4551, "lr": 6.340928937170118e-05, "epoch": 1.1146067415730336, "percentage": 37.24, "elapsed_time": "3:22:47", "remaining_time": "5:41:47"}
|
| 125 |
+
{"current_steps": 125, "total_steps": 333, "loss": 0.4587, "lr": 6.30672128845947e-05, "epoch": 1.1235955056179776, "percentage": 37.54, "elapsed_time": "3:24:24", "remaining_time": "5:40:07"}
|
| 126 |
+
{"current_steps": 126, "total_steps": 333, "loss": 0.4527, "lr": 6.272258986924624e-05, "epoch": 1.1325842696629214, "percentage": 37.84, "elapsed_time": "3:26:01", "remaining_time": "5:38:28"}
|
| 127 |
+
{"current_steps": 127, "total_steps": 333, "loss": 0.4518, "lr": 6.237545837066133e-05, "epoch": 1.1415730337078651, "percentage": 38.14, "elapsed_time": "3:27:38", "remaining_time": "5:36:48"}
|
| 128 |
+
{"current_steps": 128, "total_steps": 333, "loss": 0.4474, "lr": 6.202585671077204e-05, "epoch": 1.1505617977528089, "percentage": 38.44, "elapsed_time": "3:29:15", "remaining_time": "5:35:08"}
|
| 129 |
+
{"current_steps": 129, "total_steps": 333, "loss": 0.4573, "lr": 6.167382348420637e-05, "epoch": 1.1595505617977528, "percentage": 38.74, "elapsed_time": "3:30:52", "remaining_time": "5:33:28"}
|
| 130 |
+
{"current_steps": 130, "total_steps": 333, "loss": 0.4551, "lr": 6.131939755402755e-05, "epoch": 1.1685393258426966, "percentage": 39.04, "elapsed_time": "3:32:29", "remaining_time": "5:31:48"}
|
| 131 |
+
{"current_steps": 131, "total_steps": 333, "loss": 0.4524, "lr": 6.09626180474438e-05, "epoch": 1.1775280898876406, "percentage": 39.34, "elapsed_time": "3:34:06", "remaining_time": "5:30:08"}
|
| 132 |
+
{"current_steps": 132, "total_steps": 333, "loss": 0.4559, "lr": 6.060352435148874e-05, "epoch": 1.1865168539325843, "percentage": 39.64, "elapsed_time": "3:35:43", "remaining_time": "5:28:29"}
|
| 133 |
+
{"current_steps": 133, "total_steps": 333, "loss": 0.4603, "lr": 6.024215610867327e-05, "epoch": 1.195505617977528, "percentage": 39.94, "elapsed_time": "3:37:20", "remaining_time": "5:26:49"}
|
| 134 |
+
{"current_steps": 134, "total_steps": 333, "loss": 0.4516, "lr": 5.9878553212609184e-05, "epoch": 1.2044943820224718, "percentage": 40.24, "elapsed_time": "3:38:57", "remaining_time": "5:25:10"}
|
| 135 |
+
{"current_steps": 135, "total_steps": 333, "loss": 0.4596, "lr": 5.95127558036051e-05, "epoch": 1.2134831460674158, "percentage": 40.54, "elapsed_time": "3:40:34", "remaining_time": "5:23:30"}
|
| 136 |
+
{"current_steps": 136, "total_steps": 333, "loss": 0.4576, "lr": 5.9144804264235066e-05, "epoch": 1.2224719101123596, "percentage": 40.84, "elapsed_time": "3:42:11", "remaining_time": "5:21:51"}
|
| 137 |
+
{"current_steps": 137, "total_steps": 333, "loss": 0.4602, "lr": 5.8774739214880554e-05, "epoch": 1.2314606741573033, "percentage": 41.14, "elapsed_time": "3:43:48", "remaining_time": "5:20:11"}
|
| 138 |
+
{"current_steps": 138, "total_steps": 333, "loss": 0.45, "lr": 5.840260150924609e-05, "epoch": 1.2404494382022473, "percentage": 41.44, "elapsed_time": "3:45:25", "remaining_time": "5:18:32"}
|
| 139 |
+
{"current_steps": 139, "total_steps": 333, "loss": 0.4564, "lr": 5.802843222984919e-05, "epoch": 1.249438202247191, "percentage": 41.74, "elapsed_time": "3:47:02", "remaining_time": "5:16:52"}
|
| 140 |
+
{"current_steps": 140, "total_steps": 333, "loss": 0.4533, "lr": 5.765227268348501e-05, "epoch": 1.2584269662921348, "percentage": 42.04, "elapsed_time": "3:48:39", "remaining_time": "5:15:13"}
|
| 141 |
+
{"current_steps": 141, "total_steps": 333, "loss": 0.457, "lr": 5.727416439666622e-05, "epoch": 1.2674157303370785, "percentage": 42.34, "elapsed_time": "3:50:16", "remaining_time": "5:13:34"}
|
| 142 |
+
{"current_steps": 142, "total_steps": 333, "loss": 0.4516, "lr": 5.689414911103867e-05, "epoch": 1.2764044943820225, "percentage": 42.64, "elapsed_time": "3:51:54", "remaining_time": "5:11:55"}
|
| 143 |
+
{"current_steps": 143, "total_steps": 333, "loss": 0.4556, "lr": 5.651226877877326e-05, "epoch": 1.2853932584269663, "percentage": 42.94, "elapsed_time": "3:53:30", "remaining_time": "5:10:16"}
|
| 144 |
+
{"current_steps": 144, "total_steps": 333, "loss": 0.4554, "lr": 5.612856555793459e-05, "epoch": 1.29438202247191, "percentage": 43.24, "elapsed_time": "3:55:07", "remaining_time": "5:08:36"}
|
| 145 |
+
{"current_steps": 145, "total_steps": 333, "loss": 0.4491, "lr": 5.574308180782693e-05, "epoch": 1.303370786516854, "percentage": 43.54, "elapsed_time": "3:56:44", "remaining_time": "5:06:57"}
|
| 146 |
+
{"current_steps": 146, "total_steps": 333, "loss": 0.4575, "lr": 5.5355860084317787e-05, "epoch": 1.3123595505617978, "percentage": 43.84, "elapsed_time": "3:58:21", "remaining_time": "5:05:18"}
|
| 147 |
+
{"current_steps": 147, "total_steps": 333, "loss": 0.4536, "lr": 5.496694313514009e-05, "epoch": 1.3213483146067415, "percentage": 44.14, "elapsed_time": "3:59:58", "remaining_time": "5:03:38"}
|
| 148 |
+
{"current_steps": 148, "total_steps": 333, "loss": 0.4616, "lr": 5.457637389517285e-05, "epoch": 1.3303370786516853, "percentage": 44.44, "elapsed_time": "4:01:35", "remaining_time": "5:01:59"}
|
| 149 |
+
{"current_steps": 149, "total_steps": 333, "loss": 0.4474, "lr": 5.4184195481701425e-05, "epoch": 1.3393258426966292, "percentage": 44.74, "elapsed_time": "4:03:12", "remaining_time": "5:00:20"}
|
| 150 |
+
{"current_steps": 150, "total_steps": 333, "loss": 0.4511, "lr": 5.3790451189657486e-05, "epoch": 1.348314606741573, "percentage": 45.05, "elapsed_time": "4:04:49", "remaining_time": "4:58:41"}
|
| 151 |
+
{"current_steps": 151, "total_steps": 333, "loss": 0.4514, "lr": 5.339518448683945e-05, "epoch": 1.357303370786517, "percentage": 45.35, "elapsed_time": "4:06:26", "remaining_time": "4:57:02"}
|
| 152 |
+
{"current_steps": 152, "total_steps": 333, "loss": 0.4522, "lr": 5.2998439009113814e-05, "epoch": 1.3662921348314607, "percentage": 45.65, "elapsed_time": "4:08:03", "remaining_time": "4:55:23"}
|
| 153 |
+
{"current_steps": 153, "total_steps": 333, "loss": 0.457, "lr": 5.260025855559792e-05, "epoch": 1.3752808988764045, "percentage": 45.95, "elapsed_time": "4:09:40", "remaining_time": "4:53:44"}
|
| 154 |
+
{"current_steps": 154, "total_steps": 333, "loss": 0.4501, "lr": 5.2200687083824706e-05, "epoch": 1.3842696629213482, "percentage": 46.25, "elapsed_time": "4:11:17", "remaining_time": "4:52:04"}
|
| 155 |
+
{"current_steps": 155, "total_steps": 333, "loss": 0.4508, "lr": 5.179976870488999e-05, "epoch": 1.3932584269662922, "percentage": 46.55, "elapsed_time": "4:12:53", "remaining_time": "4:50:25"}
|
| 156 |
+
{"current_steps": 156, "total_steps": 333, "loss": 0.4507, "lr": 5.1397547678582745e-05, "epoch": 1.402247191011236, "percentage": 46.85, "elapsed_time": "4:14:30", "remaining_time": "4:48:46"}
|
| 157 |
+
{"current_steps": 157, "total_steps": 333, "loss": 0.4535, "lr": 5.099406840849902e-05, "epoch": 1.4112359550561797, "percentage": 47.15, "elapsed_time": "4:16:07", "remaining_time": "4:47:07"}
|
| 158 |
+
{"current_steps": 158, "total_steps": 333, "loss": 0.4436, "lr": 5.058937543713999e-05, "epoch": 1.4202247191011237, "percentage": 47.45, "elapsed_time": "4:17:44", "remaining_time": "4:45:28"}
|
| 159 |
+
{"current_steps": 159, "total_steps": 333, "loss": 0.4532, "lr": 5.018351344099453e-05, "epoch": 1.4292134831460674, "percentage": 47.75, "elapsed_time": "4:19:21", "remaining_time": "4:43:49"}
|
| 160 |
+
{"current_steps": 160, "total_steps": 333, "loss": 0.4511, "lr": 4.9776527225607274e-05, "epoch": 1.4382022471910112, "percentage": 48.05, "elapsed_time": "4:20:58", "remaining_time": "4:42:11"}
|
| 161 |
+
{"current_steps": 161, "total_steps": 333, "loss": 0.4485, "lr": 4.93684617206321e-05, "epoch": 1.447191011235955, "percentage": 48.35, "elapsed_time": "4:22:35", "remaining_time": "4:40:32"}
|
| 162 |
+
{"current_steps": 162, "total_steps": 333, "loss": 0.4481, "lr": 4.89593619748722e-05, "epoch": 1.456179775280899, "percentage": 48.65, "elapsed_time": "4:24:12", "remaining_time": "4:38:53"}
|
| 163 |
+
{"current_steps": 163, "total_steps": 333, "loss": 0.4446, "lr": 4.8549273151306795e-05, "epoch": 1.4651685393258427, "percentage": 48.95, "elapsed_time": "4:25:49", "remaining_time": "4:37:14"}
|
| 164 |
+
{"current_steps": 164, "total_steps": 333, "loss": 0.4516, "lr": 4.8138240522105365e-05, "epoch": 1.4741573033707867, "percentage": 49.25, "elapsed_time": "4:27:26", "remaining_time": "4:35:35"}
|
| 165 |
+
{"current_steps": 165, "total_steps": 333, "loss": 0.439, "lr": 4.7726309463629733e-05, "epoch": 1.4831460674157304, "percentage": 49.55, "elapsed_time": "4:29:03", "remaining_time": "4:33:57"}
|
| 166 |
+
{"current_steps": 166, "total_steps": 333, "loss": 0.449, "lr": 4.731352545142478e-05, "epoch": 1.4921348314606742, "percentage": 49.85, "elapsed_time": "4:30:40", "remaining_time": "4:32:18"}
|
| 167 |
+
{"current_steps": 167, "total_steps": 333, "loss": 0.4433, "lr": 4.689993405519802e-05, "epoch": 1.501123595505618, "percentage": 50.15, "elapsed_time": "4:32:17", "remaining_time": "4:30:40"}
|
| 168 |
+
{"current_steps": 168, "total_steps": 333, "loss": 0.4501, "lr": 4.648558093378899e-05, "epoch": 1.5101123595505617, "percentage": 50.45, "elapsed_time": "4:33:54", "remaining_time": "4:29:01"}
|
| 169 |
+
{"current_steps": 169, "total_steps": 333, "loss": 0.4422, "lr": 4.607051183012862e-05, "epoch": 1.5191011235955056, "percentage": 50.75, "elapsed_time": "4:35:31", "remaining_time": "4:27:22"}
|
| 170 |
+
{"current_steps": 170, "total_steps": 333, "loss": 0.4439, "lr": 4.5654772566189415e-05, "epoch": 1.5280898876404494, "percentage": 51.05, "elapsed_time": "4:37:08", "remaining_time": "4:25:44"}
|
| 171 |
+
{"current_steps": 171, "total_steps": 333, "loss": 0.4464, "lr": 4.5238409037926905e-05, "epoch": 1.5370786516853934, "percentage": 51.35, "elapsed_time": "4:38:45", "remaining_time": "4:24:05"}
|
| 172 |
+
{"current_steps": 172, "total_steps": 333, "loss": 0.4515, "lr": 4.4821467210212924e-05, "epoch": 1.5460674157303371, "percentage": 51.65, "elapsed_time": "4:40:22", "remaining_time": "4:22:26"}
|
| 173 |
+
{"current_steps": 173, "total_steps": 333, "loss": 0.4487, "lr": 4.4403993111761265e-05, "epoch": 1.5550561797752809, "percentage": 51.95, "elapsed_time": "4:41:59", "remaining_time": "4:20:48"}
|
| 174 |
+
{"current_steps": 174, "total_steps": 333, "loss": 0.4349, "lr": 4.398603283004626e-05, "epoch": 1.5640449438202246, "percentage": 52.25, "elapsed_time": "4:43:36", "remaining_time": "4:19:09"}
|
| 175 |
+
{"current_steps": 175, "total_steps": 333, "loss": 0.439, "lr": 4.356763250621496e-05, "epoch": 1.5730337078651684, "percentage": 52.55, "elapsed_time": "4:45:13", "remaining_time": "4:17:31"}
|
| 176 |
+
{"current_steps": 176, "total_steps": 333, "loss": 0.4399, "lr": 4.314883832999326e-05, "epoch": 1.5820224719101124, "percentage": 52.85, "elapsed_time": "4:46:50", "remaining_time": "4:15:52"}
|
| 177 |
+
{"current_steps": 177, "total_steps": 333, "loss": 0.449, "lr": 4.272969653458685e-05, "epoch": 1.5910112359550563, "percentage": 53.15, "elapsed_time": "4:48:27", "remaining_time": "4:14:13"}
|
| 178 |
+
{"current_steps": 178, "total_steps": 333, "loss": 0.4368, "lr": 4.231025339157714e-05, "epoch": 1.6, "percentage": 53.45, "elapsed_time": "4:50:04", "remaining_time": "4:12:35"}
|
| 179 |
+
{"current_steps": 179, "total_steps": 333, "loss": 0.4447, "lr": 4.189055520581315e-05, "epoch": 1.6089887640449438, "percentage": 53.75, "elapsed_time": "4:51:40", "remaining_time": "4:10:56"}
|
| 180 |
+
{"current_steps": 180, "total_steps": 333, "loss": 0.445, "lr": 4.147064831029959e-05, "epoch": 1.6179775280898876, "percentage": 54.05, "elapsed_time": "4:53:17", "remaining_time": "4:09:17"}
|
| 181 |
+
{"current_steps": 181, "total_steps": 333, "loss": 0.4452, "lr": 4.105057906108189e-05, "epoch": 1.6269662921348313, "percentage": 54.35, "elapsed_time": "4:54:54", "remaining_time": "4:07:39"}
|
| 182 |
+
{"current_steps": 182, "total_steps": 333, "loss": 0.4425, "lr": 4.063039383212866e-05, "epoch": 1.6359550561797753, "percentage": 54.65, "elapsed_time": "4:56:31", "remaining_time": "4:06:00"}
|
| 183 |
+
{"current_steps": 183, "total_steps": 333, "loss": 0.4411, "lr": 4.021013901021225e-05, "epoch": 1.644943820224719, "percentage": 54.95, "elapsed_time": "4:58:08", "remaining_time": "4:04:22"}
|
| 184 |
+
{"current_steps": 184, "total_steps": 333, "loss": 0.4517, "lr": 3.978986098978777e-05, "epoch": 1.653932584269663, "percentage": 55.26, "elapsed_time": "4:59:45", "remaining_time": "4:02:44"}
|
| 185 |
+
{"current_steps": 185, "total_steps": 333, "loss": 0.4446, "lr": 3.936960616787135e-05, "epoch": 1.6629213483146068, "percentage": 55.56, "elapsed_time": "5:01:22", "remaining_time": "4:01:05"}
|
| 186 |
+
{"current_steps": 186, "total_steps": 333, "loss": 0.4364, "lr": 3.8949420938918124e-05, "epoch": 1.6719101123595506, "percentage": 55.86, "elapsed_time": "5:02:58", "remaining_time": "3:59:27"}
|
| 187 |
+
{"current_steps": 187, "total_steps": 333, "loss": 0.4357, "lr": 3.852935168970042e-05, "epoch": 1.6808988764044943, "percentage": 56.16, "elapsed_time": "5:04:35", "remaining_time": "3:57:48"}
|
| 188 |
+
{"current_steps": 188, "total_steps": 333, "loss": 0.4399, "lr": 3.810944479418686e-05, "epoch": 1.689887640449438, "percentage": 56.46, "elapsed_time": "5:06:12", "remaining_time": "3:56:10"}
|
| 189 |
+
{"current_steps": 189, "total_steps": 333, "loss": 0.4475, "lr": 3.768974660842287e-05, "epoch": 1.698876404494382, "percentage": 56.76, "elapsed_time": "5:07:49", "remaining_time": "3:54:31"}
|
| 190 |
+
{"current_steps": 190, "total_steps": 333, "loss": 0.437, "lr": 3.727030346541317e-05, "epoch": 1.7078651685393258, "percentage": 57.06, "elapsed_time": "5:09:26", "remaining_time": "3:52:53"}
|
| 191 |
+
{"current_steps": 191, "total_steps": 333, "loss": 0.4376, "lr": 3.685116167000675e-05, "epoch": 1.7168539325842698, "percentage": 57.36, "elapsed_time": "5:11:03", "remaining_time": "3:51:15"}
|
| 192 |
+
{"current_steps": 192, "total_steps": 333, "loss": 0.438, "lr": 3.6432367493785056e-05, "epoch": 1.7258426966292135, "percentage": 57.66, "elapsed_time": "5:12:40", "remaining_time": "3:49:36"}
|
| 193 |
+
{"current_steps": 193, "total_steps": 333, "loss": 0.4388, "lr": 3.601396716995375e-05, "epoch": 1.7348314606741573, "percentage": 57.96, "elapsed_time": "5:14:17", "remaining_time": "3:47:58"}
|
| 194 |
+
{"current_steps": 194, "total_steps": 333, "loss": 0.4452, "lr": 3.559600688823875e-05, "epoch": 1.743820224719101, "percentage": 58.26, "elapsed_time": "5:15:53", "remaining_time": "3:46:20"}
|
| 195 |
+
{"current_steps": 195, "total_steps": 333, "loss": 0.442, "lr": 3.517853278978708e-05, "epoch": 1.7528089887640448, "percentage": 58.56, "elapsed_time": "5:17:30", "remaining_time": "3:44:42"}
|
| 196 |
+
{"current_steps": 196, "total_steps": 333, "loss": 0.4437, "lr": 3.4761590962073115e-05, "epoch": 1.7617977528089888, "percentage": 58.86, "elapsed_time": "5:19:07", "remaining_time": "3:43:04"}
|
| 197 |
+
{"current_steps": 197, "total_steps": 333, "loss": 0.4496, "lr": 3.434522743381061e-05, "epoch": 1.7707865168539327, "percentage": 59.16, "elapsed_time": "5:20:44", "remaining_time": "3:41:25"}
|
| 198 |
+
{"current_steps": 198, "total_steps": 333, "loss": 0.4443, "lr": 3.39294881698714e-05, "epoch": 1.7797752808988765, "percentage": 59.46, "elapsed_time": "5:22:21", "remaining_time": "3:39:47"}
|
| 199 |
+
{"current_steps": 199, "total_steps": 333, "loss": 0.4383, "lr": 3.3514419066211025e-05, "epoch": 1.7887640449438202, "percentage": 59.76, "elapsed_time": "5:23:58", "remaining_time": "3:38:09"}
|
| 200 |
+
{"current_steps": 200, "total_steps": 333, "loss": 0.4373, "lr": 3.310006594480199e-05, "epoch": 1.797752808988764, "percentage": 60.06, "elapsed_time": "5:25:35", "remaining_time": "3:36:31"}
|
| 201 |
+
{"current_steps": 201, "total_steps": 333, "loss": 0.4432, "lr": 3.268647454857524e-05, "epoch": 1.8067415730337077, "percentage": 60.36, "elapsed_time": "5:27:12", "remaining_time": "3:34:53"}
|
| 202 |
+
{"current_steps": 202, "total_steps": 333, "loss": 0.4378, "lr": 3.227369053637028e-05, "epoch": 1.8157303370786517, "percentage": 60.66, "elapsed_time": "5:28:49", "remaining_time": "3:33:15"}
|
| 203 |
+
{"current_steps": 203, "total_steps": 333, "loss": 0.4511, "lr": 3.1861759477894656e-05, "epoch": 1.8247191011235955, "percentage": 60.96, "elapsed_time": "5:30:26", "remaining_time": "3:31:36"}
|
| 204 |
+
{"current_steps": 204, "total_steps": 333, "loss": 0.4408, "lr": 3.145072684869322e-05, "epoch": 1.8337078651685395, "percentage": 61.26, "elapsed_time": "5:32:03", "remaining_time": "3:29:58"}
|
| 205 |
+
{"current_steps": 205, "total_steps": 333, "loss": 0.4428, "lr": 3.104063802512782e-05, "epoch": 1.8426966292134832, "percentage": 61.56, "elapsed_time": "5:33:40", "remaining_time": "3:28:20"}
|
| 206 |
+
{"current_steps": 206, "total_steps": 333, "loss": 0.4387, "lr": 3.063153827936792e-05, "epoch": 1.851685393258427, "percentage": 61.86, "elapsed_time": "5:35:17", "remaining_time": "3:26:42"}
|
| 207 |
+
{"current_steps": 207, "total_steps": 333, "loss": 0.4373, "lr": 3.0223472774392753e-05, "epoch": 1.8606741573033707, "percentage": 62.16, "elapsed_time": "5:36:54", "remaining_time": "3:25:04"}
|
| 208 |
+
{"current_steps": 208, "total_steps": 333, "loss": 0.4428, "lr": 2.9816486559005482e-05, "epoch": 1.8696629213483145, "percentage": 62.46, "elapsed_time": "5:38:31", "remaining_time": "3:23:26"}
|
| 209 |
+
{"current_steps": 209, "total_steps": 333, "loss": 0.4374, "lr": 2.9410624562860026e-05, "epoch": 1.8786516853932584, "percentage": 62.76, "elapsed_time": "5:40:08", "remaining_time": "3:21:48"}
|
| 210 |
+
{"current_steps": 210, "total_steps": 333, "loss": 0.4377, "lr": 2.9005931591500974e-05, "epoch": 1.8876404494382022, "percentage": 63.06, "elapsed_time": "5:41:46", "remaining_time": "3:20:10"}
|
| 211 |
+
{"current_steps": 211, "total_steps": 333, "loss": 0.4446, "lr": 2.860245232141726e-05, "epoch": 1.8966292134831462, "percentage": 63.36, "elapsed_time": "5:43:23", "remaining_time": "3:18:33"}
|
| 212 |
+
{"current_steps": 212, "total_steps": 333, "loss": 0.4449, "lr": 2.8200231295110012e-05, "epoch": 1.90561797752809, "percentage": 63.66, "elapsed_time": "5:45:00", "remaining_time": "3:16:54"}
|
| 213 |
+
{"current_steps": 213, "total_steps": 333, "loss": 0.4474, "lr": 2.7799312916175294e-05, "epoch": 1.9146067415730337, "percentage": 63.96, "elapsed_time": "5:46:37", "remaining_time": "3:15:16"}
|
| 214 |
+
{"current_steps": 214, "total_steps": 333, "loss": 0.4396, "lr": 2.7399741444402087e-05, "epoch": 1.9235955056179774, "percentage": 64.26, "elapsed_time": "5:48:14", "remaining_time": "3:13:38"}
|
| 215 |
+
{"current_steps": 215, "total_steps": 333, "loss": 0.432, "lr": 2.7001560990886196e-05, "epoch": 1.9325842696629212, "percentage": 64.56, "elapsed_time": "5:49:51", "remaining_time": "3:12:00"}
|
| 216 |
+
{"current_steps": 216, "total_steps": 333, "loss": 0.4347, "lr": 2.6604815513160556e-05, "epoch": 1.9415730337078652, "percentage": 64.86, "elapsed_time": "5:51:28", "remaining_time": "3:10:23"}
|
| 217 |
+
{"current_steps": 217, "total_steps": 333, "loss": 0.4272, "lr": 2.6209548810342517e-05, "epoch": 1.9505617977528091, "percentage": 65.17, "elapsed_time": "5:53:05", "remaining_time": "3:08:45"}
|
| 218 |
+
{"current_steps": 218, "total_steps": 333, "loss": 0.4373, "lr": 2.5815804518298575e-05, "epoch": 1.9595505617977529, "percentage": 65.47, "elapsed_time": "5:54:43", "remaining_time": "3:07:07"}
|
| 219 |
+
{"current_steps": 219, "total_steps": 333, "loss": 0.4346, "lr": 2.542362610482715e-05, "epoch": 1.9685393258426966, "percentage": 65.77, "elapsed_time": "5:56:20", "remaining_time": "3:05:29"}
|
| 220 |
+
{"current_steps": 220, "total_steps": 333, "loss": 0.444, "lr": 2.503305686485991e-05, "epoch": 1.9775280898876404, "percentage": 66.07, "elapsed_time": "5:57:57", "remaining_time": "3:03:51"}
|
| 221 |
+
{"current_steps": 221, "total_steps": 333, "loss": 0.4413, "lr": 2.464413991568222e-05, "epoch": 1.9865168539325841, "percentage": 66.37, "elapsed_time": "5:59:34", "remaining_time": "3:02:13"}
|
| 222 |
+
{"current_steps": 222, "total_steps": 333, "loss": 0.4383, "lr": 2.4256918192173088e-05, "epoch": 1.9955056179775281, "percentage": 66.67, "elapsed_time": "6:01:10", "remaining_time": "3:00:35"}
|
| 223 |
+
{"current_steps": 223, "total_steps": 333, "loss": 0.7545, "lr": 2.3871434442065414e-05, "epoch": 2.004494382022472, "percentage": 66.97, "elapsed_time": "6:04:22", "remaining_time": "2:59:44"}
|