Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb1dbbaffccdef634895af1dc41094c17a0f9ef6909ae058e0e7a0034c3f9f86
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:63b6be41a886ebf3e7e1f7436f446d726261d5102dc39104a4f244799727bf16
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9dc8a44f653c13e0c835349e4833604532b152d43fe93f7206b66d81d94df80
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:39e18072a23dfacf537a3e7534df1667202620c989c5d7df0abee04de5678dd0
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -163,3 +163,159 @@
|
|
| 163 |
{"current_steps": 163, "total_steps": 468, "loss": 0.4215, "lr": 3.2963408261694026e-05, "epoch": 1.0415335463258786, "percentage": 34.83, "elapsed_time": "0:57:49", "remaining_time": "1:48:12"}
|
| 164 |
{"current_steps": 164, "total_steps": 468, "loss": 0.4247, "lr": 3.284939954630428e-05, "epoch": 1.0479233226837061, "percentage": 35.04, "elapsed_time": "0:58:12", "remaining_time": "1:47:53"}
|
| 165 |
{"current_steps": 165, "total_steps": 468, "loss": 0.4013, "lr": 3.2734675319820446e-05, "epoch": 1.0543130990415335, "percentage": 35.26, "elapsed_time": "0:58:35", "remaining_time": "1:47:35"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 163 |
{"current_steps": 163, "total_steps": 468, "loss": 0.4215, "lr": 3.2963408261694026e-05, "epoch": 1.0415335463258786, "percentage": 34.83, "elapsed_time": "0:57:49", "remaining_time": "1:48:12"}
|
| 164 |
{"current_steps": 164, "total_steps": 468, "loss": 0.4247, "lr": 3.284939954630428e-05, "epoch": 1.0479233226837061, "percentage": 35.04, "elapsed_time": "0:58:12", "remaining_time": "1:47:53"}
|
| 165 |
{"current_steps": 165, "total_steps": 468, "loss": 0.4013, "lr": 3.2734675319820446e-05, "epoch": 1.0543130990415335, "percentage": 35.26, "elapsed_time": "0:58:35", "remaining_time": "1:47:35"}
|
| 166 |
+
{"current_steps": 166, "total_steps": 468, "loss": 0.4592, "lr": 3.261924197059215e-05, "epoch": 1.060702875399361, "percentage": 35.47, "elapsed_time": "0:58:57", "remaining_time": "1:47:16"}
|
| 167 |
+
{"current_steps": 167, "total_steps": 468, "loss": 0.3779, "lr": 3.25031059264561e-05, "epoch": 1.0670926517571886, "percentage": 35.68, "elapsed_time": "0:59:17", "remaining_time": "1:46:51"}
|
| 168 |
+
{"current_steps": 168, "total_steps": 468, "loss": 0.3354, "lr": 3.2386273654378134e-05, "epoch": 1.073482428115016, "percentage": 35.9, "elapsed_time": "0:59:42", "remaining_time": "1:46:37"}
|
| 169 |
+
{"current_steps": 169, "total_steps": 468, "loss": 0.3658, "lr": 3.226875166009313e-05, "epoch": 1.0798722044728435, "percentage": 36.11, "elapsed_time": "1:00:05", "remaining_time": "1:46:19"}
|
| 170 |
+
{"current_steps": 170, "total_steps": 468, "loss": 0.4916, "lr": 3.215054648774274e-05, "epoch": 1.0862619808306708, "percentage": 36.32, "elapsed_time": "1:00:28", "remaining_time": "1:46:00"}
|
| 171 |
+
{"current_steps": 171, "total_steps": 468, "loss": 0.3829, "lr": 3.2031664719510967e-05, "epoch": 1.0926517571884984, "percentage": 36.54, "elapsed_time": "1:00:48", "remaining_time": "1:45:36"}
|
| 172 |
+
{"current_steps": 172, "total_steps": 468, "loss": 0.4622, "lr": 3.1912112975257664e-05, "epoch": 1.099041533546326, "percentage": 36.75, "elapsed_time": "1:01:12", "remaining_time": "1:45:20"}
|
| 173 |
+
{"current_steps": 173, "total_steps": 468, "loss": 0.3948, "lr": 3.1791897912149874e-05, "epoch": 1.1054313099041533, "percentage": 36.97, "elapsed_time": "1:01:35", "remaining_time": "1:45:02"}
|
| 174 |
+
{"current_steps": 174, "total_steps": 468, "loss": 0.364, "lr": 3.167102622429117e-05, "epoch": 1.1118210862619808, "percentage": 37.18, "elapsed_time": "1:01:57", "remaining_time": "1:44:41"}
|
| 175 |
+
{"current_steps": 175, "total_steps": 468, "loss": 0.3855, "lr": 3.1549504642348856e-05, "epoch": 1.1182108626198084, "percentage": 37.39, "elapsed_time": "1:02:18", "remaining_time": "1:44:20"}
|
| 176 |
+
{"current_steps": 176, "total_steps": 468, "loss": 0.3966, "lr": 3.142733993317924e-05, "epoch": 1.1246006389776357, "percentage": 37.61, "elapsed_time": "1:02:39", "remaining_time": "1:43:56"}
|
| 177 |
+
{"current_steps": 177, "total_steps": 468, "loss": 0.4024, "lr": 3.130453889945075e-05, "epoch": 1.1309904153354633, "percentage": 37.82, "elapsed_time": "1:03:02", "remaining_time": "1:43:37"}
|
| 178 |
+
{"current_steps": 178, "total_steps": 468, "loss": 0.3553, "lr": 3.118110837926517e-05, "epoch": 1.1373801916932909, "percentage": 38.03, "elapsed_time": "1:03:19", "remaining_time": "1:43:10"}
|
| 179 |
+
{"current_steps": 179, "total_steps": 468, "loss": 0.4578, "lr": 3.105705524577686e-05, "epoch": 1.1437699680511182, "percentage": 38.25, "elapsed_time": "1:03:42", "remaining_time": "1:42:51"}
|
| 180 |
+
{"current_steps": 180, "total_steps": 468, "loss": 0.3781, "lr": 3.093238640681003e-05, "epoch": 1.1501597444089458, "percentage": 38.46, "elapsed_time": "1:04:03", "remaining_time": "1:42:28"}
|
| 181 |
+
{"current_steps": 181, "total_steps": 468, "loss": 0.3887, "lr": 3.080710880447408e-05, "epoch": 1.156549520766773, "percentage": 38.68, "elapsed_time": "1:04:22", "remaining_time": "1:42:05"}
|
| 182 |
+
{"current_steps": 182, "total_steps": 468, "loss": 0.4388, "lr": 3.068122941477704e-05, "epoch": 1.1629392971246006, "percentage": 38.89, "elapsed_time": "1:04:45", "remaining_time": "1:41:46"}
|
| 183 |
+
{"current_steps": 183, "total_steps": 468, "loss": 0.3889, "lr": 3.05547552472371e-05, "epoch": 1.1693290734824282, "percentage": 39.1, "elapsed_time": "1:05:03", "remaining_time": "1:41:19"}
|
| 184 |
+
{"current_steps": 184, "total_steps": 468, "loss": 0.4279, "lr": 3.0427693344492278e-05, "epoch": 1.1757188498402555, "percentage": 39.32, "elapsed_time": "1:05:22", "remaining_time": "1:40:54"}
|
| 185 |
+
{"current_steps": 185, "total_steps": 468, "loss": 0.3517, "lr": 3.0300050781908305e-05, "epoch": 1.182108626198083, "percentage": 39.53, "elapsed_time": "1:05:43", "remaining_time": "1:40:33"}
|
| 186 |
+
{"current_steps": 186, "total_steps": 468, "loss": 0.3922, "lr": 3.0171834667184597e-05, "epoch": 1.1884984025559104, "percentage": 39.74, "elapsed_time": "1:06:05", "remaining_time": "1:40:12"}
|
| 187 |
+
{"current_steps": 187, "total_steps": 468, "loss": 0.4332, "lr": 3.0043052139958465e-05, "epoch": 1.194888178913738, "percentage": 39.96, "elapsed_time": "1:06:26", "remaining_time": "1:39:50"}
|
| 188 |
+
{"current_steps": 188, "total_steps": 468, "loss": 0.3973, "lr": 2.9913710371407574e-05, "epoch": 1.2012779552715656, "percentage": 40.17, "elapsed_time": "1:06:47", "remaining_time": "1:39:28"}
|
| 189 |
+
{"current_steps": 189, "total_steps": 468, "loss": 0.3988, "lr": 2.97838165638506e-05, "epoch": 1.207667731629393, "percentage": 40.38, "elapsed_time": "1:07:10", "remaining_time": "1:39:10"}
|
| 190 |
+
{"current_steps": 190, "total_steps": 468, "loss": 0.4124, "lr": 2.965337795034617e-05, "epoch": 1.2140575079872205, "percentage": 40.6, "elapsed_time": "1:07:28", "remaining_time": "1:38:43"}
|
| 191 |
+
{"current_steps": 191, "total_steps": 468, "loss": 0.478, "lr": 2.9522401794290127e-05, "epoch": 1.220447284345048, "percentage": 40.81, "elapsed_time": "1:07:49", "remaining_time": "1:38:22"}
|
| 192 |
+
{"current_steps": 192, "total_steps": 468, "loss": 0.3373, "lr": 2.9390895389011024e-05, "epoch": 1.2268370607028753, "percentage": 41.03, "elapsed_time": "1:08:05", "remaining_time": "1:37:53"}
|
| 193 |
+
{"current_steps": 193, "total_steps": 468, "loss": 0.481, "lr": 2.9258866057364028e-05, "epoch": 1.233226837060703, "percentage": 41.24, "elapsed_time": "1:08:26", "remaining_time": "1:37:30"}
|
| 194 |
+
{"current_steps": 194, "total_steps": 468, "loss": 0.3599, "lr": 2.912632115132316e-05, "epoch": 1.2396166134185305, "percentage": 41.45, "elapsed_time": "1:08:49", "remaining_time": "1:37:11"}
|
| 195 |
+
{"current_steps": 195, "total_steps": 468, "loss": 0.4054, "lr": 2.8993268051571877e-05, "epoch": 1.2460063897763578, "percentage": 41.67, "elapsed_time": "1:09:13", "remaining_time": "1:36:55"}
|
| 196 |
+
{"current_steps": 196, "total_steps": 468, "loss": 0.4582, "lr": 2.885971416709211e-05, "epoch": 1.2523961661341854, "percentage": 41.88, "elapsed_time": "1:09:36", "remaining_time": "1:36:35"}
|
| 197 |
+
{"current_steps": 197, "total_steps": 468, "loss": 0.3904, "lr": 2.8725666934751678e-05, "epoch": 1.2587859424920127, "percentage": 42.09, "elapsed_time": "1:09:55", "remaining_time": "1:36:11"}
|
| 198 |
+
{"current_steps": 198, "total_steps": 468, "loss": 0.3776, "lr": 2.859113381889018e-05, "epoch": 1.2651757188498403, "percentage": 42.31, "elapsed_time": "1:10:14", "remaining_time": "1:35:46"}
|
| 199 |
+
{"current_steps": 199, "total_steps": 468, "loss": 0.3869, "lr": 2.8456122310903342e-05, "epoch": 1.2715654952076676, "percentage": 42.52, "elapsed_time": "1:10:34", "remaining_time": "1:35:24"}
|
| 200 |
+
{"current_steps": 200, "total_steps": 468, "loss": 0.4434, "lr": 2.8320639928825885e-05, "epoch": 1.2779552715654952, "percentage": 42.74, "elapsed_time": "1:10:57", "remaining_time": "1:35:05"}
|
| 201 |
+
{"current_steps": 201, "total_steps": 468, "loss": 0.4034, "lr": 2.818469421691285e-05, "epoch": 1.2843450479233227, "percentage": 42.95, "elapsed_time": "1:11:21", "remaining_time": "1:34:47"}
|
| 202 |
+
{"current_steps": 202, "total_steps": 468, "loss": 0.4592, "lr": 2.804829274521954e-05, "epoch": 1.29073482428115, "percentage": 43.16, "elapsed_time": "1:11:42", "remaining_time": "1:34:26"}
|
| 203 |
+
{"current_steps": 203, "total_steps": 468, "loss": 0.4018, "lr": 2.7911443109179958e-05, "epoch": 1.2971246006389776, "percentage": 43.38, "elapsed_time": "1:12:04", "remaining_time": "1:34:05"}
|
| 204 |
+
{"current_steps": 204, "total_steps": 468, "loss": 0.3987, "lr": 2.777415292918386e-05, "epoch": 1.3035143769968052, "percentage": 43.59, "elapsed_time": "1:12:27", "remaining_time": "1:33:46"}
|
| 205 |
+
{"current_steps": 205, "total_steps": 468, "loss": 0.3931, "lr": 2.7636429850152452e-05, "epoch": 1.3099041533546325, "percentage": 43.8, "elapsed_time": "1:12:50", "remaining_time": "1:33:27"}
|
| 206 |
+
{"current_steps": 206, "total_steps": 468, "loss": 0.406, "lr": 2.7498281541112645e-05, "epoch": 1.31629392971246, "percentage": 44.02, "elapsed_time": "1:13:11", "remaining_time": "1:33:04"}
|
| 207 |
+
{"current_steps": 207, "total_steps": 468, "loss": 0.3969, "lr": 2.735971569477002e-05, "epoch": 1.3226837060702876, "percentage": 44.23, "elapsed_time": "1:13:33", "remaining_time": "1:32:44"}
|
| 208 |
+
{"current_steps": 208, "total_steps": 468, "loss": 0.4243, "lr": 2.72207400270805e-05, "epoch": 1.329073482428115, "percentage": 44.44, "elapsed_time": "1:13:51", "remaining_time": "1:32:19"}
|
| 209 |
+
{"current_steps": 209, "total_steps": 468, "loss": 0.3745, "lr": 2.7081362276820634e-05, "epoch": 1.3354632587859425, "percentage": 44.66, "elapsed_time": "1:14:13", "remaining_time": "1:31:58"}
|
| 210 |
+
{"current_steps": 210, "total_steps": 468, "loss": 0.4768, "lr": 2.6941590205156715e-05, "epoch": 1.34185303514377, "percentage": 44.87, "elapsed_time": "1:14:34", "remaining_time": "1:31:37"}
|
| 211 |
+
{"current_steps": 211, "total_steps": 468, "loss": 0.3741, "lr": 2.6801431595212585e-05, "epoch": 1.3482428115015974, "percentage": 45.09, "elapsed_time": "1:14:52", "remaining_time": "1:31:12"}
|
| 212 |
+
{"current_steps": 212, "total_steps": 468, "loss": 0.4173, "lr": 2.666089425163623e-05, "epoch": 1.354632587859425, "percentage": 45.3, "elapsed_time": "1:15:13", "remaining_time": "1:30:50"}
|
| 213 |
+
{"current_steps": 213, "total_steps": 468, "loss": 0.3851, "lr": 2.6519986000165197e-05, "epoch": 1.3610223642172525, "percentage": 45.51, "elapsed_time": "1:15:36", "remaining_time": "1:30:30"}
|
| 214 |
+
{"current_steps": 214, "total_steps": 468, "loss": 0.3976, "lr": 2.637871468719081e-05, "epoch": 1.3674121405750799, "percentage": 45.73, "elapsed_time": "1:15:58", "remaining_time": "1:30:10"}
|
| 215 |
+
{"current_steps": 215, "total_steps": 468, "loss": 0.3557, "lr": 2.623708817932127e-05, "epoch": 1.3738019169329074, "percentage": 45.94, "elapsed_time": "1:16:19", "remaining_time": "1:29:49"}
|
| 216 |
+
{"current_steps": 216, "total_steps": 468, "loss": 0.3675, "lr": 2.6095114362943567e-05, "epoch": 1.3801916932907348, "percentage": 46.15, "elapsed_time": "1:16:42", "remaining_time": "1:29:29"}
|
| 217 |
+
{"current_steps": 217, "total_steps": 468, "loss": 0.4192, "lr": 2.5952801143784377e-05, "epoch": 1.3865814696485623, "percentage": 46.37, "elapsed_time": "1:17:04", "remaining_time": "1:29:09"}
|
| 218 |
+
{"current_steps": 218, "total_steps": 468, "loss": 0.3929, "lr": 2.5810156446469815e-05, "epoch": 1.3929712460063897, "percentage": 46.58, "elapsed_time": "1:17:24", "remaining_time": "1:28:46"}
|
| 219 |
+
{"current_steps": 219, "total_steps": 468, "loss": 0.4085, "lr": 2.5667188214084156e-05, "epoch": 1.3993610223642172, "percentage": 46.79, "elapsed_time": "1:17:47", "remaining_time": "1:28:27"}
|
| 220 |
+
{"current_steps": 220, "total_steps": 468, "loss": 0.4069, "lr": 2.5523904407727518e-05, "epoch": 1.4057507987220448, "percentage": 47.01, "elapsed_time": "1:18:08", "remaining_time": "1:28:05"}
|
| 221 |
+
{"current_steps": 221, "total_steps": 468, "loss": 0.3844, "lr": 2.5380313006072576e-05, "epoch": 1.4121405750798721, "percentage": 47.22, "elapsed_time": "1:18:32", "remaining_time": "1:27:46"}
|
| 222 |
+
{"current_steps": 222, "total_steps": 468, "loss": 0.4525, "lr": 2.523642200492027e-05, "epoch": 1.4185303514376997, "percentage": 47.44, "elapsed_time": "1:18:54", "remaining_time": "1:27:26"}
|
| 223 |
+
{"current_steps": 223, "total_steps": 468, "loss": 0.3858, "lr": 2.5092239416754545e-05, "epoch": 1.4249201277955272, "percentage": 47.65, "elapsed_time": "1:19:15", "remaining_time": "1:27:04"}
|
| 224 |
+
{"current_steps": 224, "total_steps": 468, "loss": 0.4076, "lr": 2.4947773270296218e-05, "epoch": 1.4313099041533546, "percentage": 47.86, "elapsed_time": "1:19:34", "remaining_time": "1:26:40"}
|
| 225 |
+
{"current_steps": 225, "total_steps": 468, "loss": 0.4116, "lr": 2.4803031610055847e-05, "epoch": 1.4376996805111821, "percentage": 48.08, "elapsed_time": "1:19:53", "remaining_time": "1:26:17"}
|
| 226 |
+
{"current_steps": 226, "total_steps": 468, "loss": 0.3701, "lr": 2.465802249588583e-05, "epoch": 1.4440894568690097, "percentage": 48.29, "elapsed_time": "1:20:14", "remaining_time": "1:25:55"}
|
| 227 |
+
{"current_steps": 227, "total_steps": 468, "loss": 0.3497, "lr": 2.451275400253157e-05, "epoch": 1.450479233226837, "percentage": 48.5, "elapsed_time": "1:20:30", "remaining_time": "1:25:28"}
|
| 228 |
+
{"current_steps": 228, "total_steps": 468, "loss": 0.4835, "lr": 2.436723421918185e-05, "epoch": 1.4568690095846646, "percentage": 48.72, "elapsed_time": "1:20:53", "remaining_time": "1:25:08"}
|
| 229 |
+
{"current_steps": 229, "total_steps": 468, "loss": 0.373, "lr": 2.4221471249018368e-05, "epoch": 1.4632587859424921, "percentage": 48.93, "elapsed_time": "1:21:10", "remaining_time": "1:24:43"}
|
| 230 |
+
{"current_steps": 230, "total_steps": 468, "loss": 0.3923, "lr": 2.4075473208764558e-05, "epoch": 1.4696485623003195, "percentage": 49.15, "elapsed_time": "1:21:31", "remaining_time": "1:24:22"}
|
| 231 |
+
{"current_steps": 231, "total_steps": 468, "loss": 0.3575, "lr": 2.392924822823357e-05, "epoch": 1.476038338658147, "percentage": 49.36, "elapsed_time": "1:21:52", "remaining_time": "1:23:59"}
|
| 232 |
+
{"current_steps": 232, "total_steps": 468, "loss": 0.4385, "lr": 2.378280444987561e-05, "epoch": 1.4824281150159744, "percentage": 49.57, "elapsed_time": "1:22:12", "remaining_time": "1:23:37"}
|
| 233 |
+
{"current_steps": 233, "total_steps": 468, "loss": 0.3372, "lr": 2.3636150028324486e-05, "epoch": 1.488817891373802, "percentage": 49.79, "elapsed_time": "1:22:35", "remaining_time": "1:23:17"}
|
| 234 |
+
{"current_steps": 234, "total_steps": 468, "loss": 0.4001, "lr": 2.3489293129943555e-05, "epoch": 1.4952076677316293, "percentage": 50.0, "elapsed_time": "1:22:59", "remaining_time": "1:22:59"}
|
| 235 |
+
{"current_steps": 235, "total_steps": 468, "loss": 0.4067, "lr": 2.334224193237097e-05, "epoch": 1.5015974440894568, "percentage": 50.21, "elapsed_time": "1:23:20", "remaining_time": "1:22:38"}
|
| 236 |
+
{"current_steps": 236, "total_steps": 468, "loss": 0.3842, "lr": 2.319500462406434e-05, "epoch": 1.5079872204472844, "percentage": 50.43, "elapsed_time": "1:23:41", "remaining_time": "1:22:16"}
|
| 237 |
+
{"current_steps": 237, "total_steps": 468, "loss": 0.4108, "lr": 2.3047589403844702e-05, "epoch": 1.5143769968051117, "percentage": 50.64, "elapsed_time": "1:24:01", "remaining_time": "1:21:53"}
|
| 238 |
+
{"current_steps": 238, "total_steps": 468, "loss": 0.3344, "lr": 2.290000448044004e-05, "epoch": 1.5207667731629393, "percentage": 50.85, "elapsed_time": "1:24:21", "remaining_time": "1:21:31"}
|
| 239 |
+
{"current_steps": 239, "total_steps": 468, "loss": 0.4079, "lr": 2.2752258072028145e-05, "epoch": 1.5271565495207668, "percentage": 51.07, "elapsed_time": "1:24:42", "remaining_time": "1:21:09"}
|
| 240 |
+
{"current_steps": 240, "total_steps": 468, "loss": 0.3711, "lr": 2.260435840577901e-05, "epoch": 1.5335463258785942, "percentage": 51.28, "elapsed_time": "1:25:05", "remaining_time": "1:20:50"}
|
| 241 |
+
{"current_steps": 241, "total_steps": 468, "loss": 0.4798, "lr": 2.245631371739669e-05, "epoch": 1.5399361022364217, "percentage": 51.5, "elapsed_time": "1:25:25", "remaining_time": "1:20:27"}
|
| 242 |
+
{"current_steps": 242, "total_steps": 468, "loss": 0.3586, "lr": 2.2308132250660717e-05, "epoch": 1.5463258785942493, "percentage": 51.71, "elapsed_time": "1:25:44", "remaining_time": "1:20:04"}
|
| 243 |
+
{"current_steps": 243, "total_steps": 468, "loss": 0.341, "lr": 2.215982225696704e-05, "epoch": 1.5527156549520766, "percentage": 51.92, "elapsed_time": "1:26:02", "remaining_time": "1:19:39"}
|
| 244 |
+
{"current_steps": 244, "total_steps": 468, "loss": 0.3927, "lr": 2.201139199486856e-05, "epoch": 1.5591054313099042, "percentage": 52.14, "elapsed_time": "1:26:25", "remaining_time": "1:19:20"}
|
| 245 |
+
{"current_steps": 245, "total_steps": 468, "loss": 0.4049, "lr": 2.186284972961525e-05, "epoch": 1.5654952076677318, "percentage": 52.35, "elapsed_time": "1:26:48", "remaining_time": "1:19:00"}
|
| 246 |
+
{"current_steps": 246, "total_steps": 468, "loss": 0.3493, "lr": 2.1714203732693905e-05, "epoch": 1.571884984025559, "percentage": 52.56, "elapsed_time": "1:27:08", "remaining_time": "1:18:38"}
|
| 247 |
+
{"current_steps": 247, "total_steps": 468, "loss": 0.446, "lr": 2.1565462281367572e-05, "epoch": 1.5782747603833864, "percentage": 52.78, "elapsed_time": "1:27:29", "remaining_time": "1:18:16"}
|
| 248 |
+
{"current_steps": 248, "total_steps": 468, "loss": 0.3761, "lr": 2.141663365821459e-05, "epoch": 1.5846645367412142, "percentage": 52.99, "elapsed_time": "1:27:48", "remaining_time": "1:17:53"}
|
| 249 |
+
{"current_steps": 249, "total_steps": 468, "loss": 0.4227, "lr": 2.1267726150667426e-05, "epoch": 1.5910543130990416, "percentage": 53.21, "elapsed_time": "1:28:07", "remaining_time": "1:17:30"}
|
| 250 |
+
{"current_steps": 250, "total_steps": 468, "loss": 0.4185, "lr": 2.1118748050551194e-05, "epoch": 1.5974440894568689, "percentage": 53.42, "elapsed_time": "1:28:26", "remaining_time": "1:17:07"}
|
| 251 |
+
{"current_steps": 251, "total_steps": 468, "loss": 0.335, "lr": 2.0969707653621884e-05, "epoch": 1.6038338658146964, "percentage": 53.63, "elapsed_time": "1:28:47", "remaining_time": "1:16:45"}
|
| 252 |
+
{"current_steps": 252, "total_steps": 468, "loss": 0.4249, "lr": 2.0820613259104462e-05, "epoch": 1.610223642172524, "percentage": 53.85, "elapsed_time": "1:29:09", "remaining_time": "1:16:25"}
|
| 253 |
+
{"current_steps": 253, "total_steps": 468, "loss": 0.4078, "lr": 2.0671473169230715e-05, "epoch": 1.6166134185303513, "percentage": 54.06, "elapsed_time": "1:29:31", "remaining_time": "1:16:04"}
|
| 254 |
+
{"current_steps": 254, "total_steps": 468, "loss": 0.3872, "lr": 2.0522295688776945e-05, "epoch": 1.623003194888179, "percentage": 54.27, "elapsed_time": "1:29:51", "remaining_time": "1:15:42"}
|
| 255 |
+
{"current_steps": 255, "total_steps": 468, "loss": 0.3415, "lr": 2.037308912460153e-05, "epoch": 1.6293929712460065, "percentage": 54.49, "elapsed_time": "1:30:08", "remaining_time": "1:15:17"}
|
| 256 |
+
{"current_steps": 256, "total_steps": 468, "loss": 0.417, "lr": 2.022386178518236e-05, "epoch": 1.6357827476038338, "percentage": 54.7, "elapsed_time": "1:30:25", "remaining_time": "1:14:52"}
|
| 257 |
+
{"current_steps": 257, "total_steps": 468, "loss": 0.3882, "lr": 2.0074621980154167e-05, "epoch": 1.6421725239616614, "percentage": 54.91, "elapsed_time": "1:30:47", "remaining_time": "1:14:32"}
|
| 258 |
+
{"current_steps": 258, "total_steps": 468, "loss": 0.4104, "lr": 1.9925378019845837e-05, "epoch": 1.648562300319489, "percentage": 55.13, "elapsed_time": "1:31:09", "remaining_time": "1:14:11"}
|
| 259 |
+
{"current_steps": 259, "total_steps": 468, "loss": 0.3774, "lr": 1.9776138214817648e-05, "epoch": 1.6549520766773163, "percentage": 55.34, "elapsed_time": "1:31:29", "remaining_time": "1:13:49"}
|
| 260 |
+
{"current_steps": 260, "total_steps": 468, "loss": 0.3576, "lr": 1.9626910875398475e-05, "epoch": 1.6613418530351438, "percentage": 55.56, "elapsed_time": "1:31:47", "remaining_time": "1:13:26"}
|
| 261 |
+
{"current_steps": 261, "total_steps": 468, "loss": 0.4259, "lr": 1.9477704311223062e-05, "epoch": 1.6677316293929714, "percentage": 55.77, "elapsed_time": "1:32:08", "remaining_time": "1:13:04"}
|
| 262 |
+
{"current_steps": 262, "total_steps": 468, "loss": 0.4159, "lr": 1.932852683076929e-05, "epoch": 1.6741214057507987, "percentage": 55.98, "elapsed_time": "1:32:30", "remaining_time": "1:12:43"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 468, "loss": 0.3925, "lr": 1.9179386740895538e-05, "epoch": 1.680511182108626, "percentage": 56.2, "elapsed_time": "1:32:50", "remaining_time": "1:12:22"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 468, "loss": 0.3598, "lr": 1.9030292346378116e-05, "epoch": 1.6869009584664538, "percentage": 56.41, "elapsed_time": "1:33:14", "remaining_time": "1:12:03"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 468, "loss": 0.4128, "lr": 1.8881251949448817e-05, "epoch": 1.6932907348242812, "percentage": 56.62, "elapsed_time": "1:33:32", "remaining_time": "1:11:39"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 468, "loss": 0.3892, "lr": 1.8732273849332577e-05, "epoch": 1.6996805111821085, "percentage": 56.84, "elapsed_time": "1:33:53", "remaining_time": "1:11:17"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 468, "loss": 0.4135, "lr": 1.8583366341785424e-05, "epoch": 1.706070287539936, "percentage": 57.05, "elapsed_time": "1:34:16", "remaining_time": "1:10:58"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 468, "loss": 0.3966, "lr": 1.8434537718632438e-05, "epoch": 1.7124600638977636, "percentage": 57.26, "elapsed_time": "1:34:34", "remaining_time": "1:10:34"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 468, "loss": 0.3321, "lr": 1.8285796267306098e-05, "epoch": 1.718849840255591, "percentage": 57.48, "elapsed_time": "1:34:57", "remaining_time": "1:10:14"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 468, "loss": 0.4162, "lr": 1.8137150270384755e-05, "epoch": 1.7252396166134185, "percentage": 57.69, "elapsed_time": "1:35:18", "remaining_time": "1:09:53"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 468, "loss": 0.4086, "lr": 1.7988608005131445e-05, "epoch": 1.731629392971246, "percentage": 57.91, "elapsed_time": "1:35:37", "remaining_time": "1:09:31"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 468, "loss": 0.414, "lr": 1.7840177743032964e-05, "epoch": 1.7380191693290734, "percentage": 58.12, "elapsed_time": "1:35:55", "remaining_time": "1:09:07"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 468, "loss": 0.4176, "lr": 1.769186774933929e-05, "epoch": 1.744408945686901, "percentage": 58.33, "elapsed_time": "1:36:18", "remaining_time": "1:08:47"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 468, "loss": 0.4432, "lr": 1.7543686282603318e-05, "epoch": 1.7507987220447285, "percentage": 58.55, "elapsed_time": "1:36:40", "remaining_time": "1:08:27"}
|
| 275 |
+
{"current_steps": 275, "total_steps": 468, "loss": 0.3829, "lr": 1.7395641594220998e-05, "epoch": 1.7571884984025559, "percentage": 58.76, "elapsed_time": "1:36:59", "remaining_time": "1:08:04"}
|
| 276 |
+
{"current_steps": 276, "total_steps": 468, "loss": 0.382, "lr": 1.724774192797186e-05, "epoch": 1.7635782747603834, "percentage": 58.97, "elapsed_time": "1:37:21", "remaining_time": "1:07:43"}
|
| 277 |
+
{"current_steps": 277, "total_steps": 468, "loss": 0.3575, "lr": 1.7099995519559963e-05, "epoch": 1.769968051118211, "percentage": 59.19, "elapsed_time": "1:37:42", "remaining_time": "1:07:22"}
|
| 278 |
+
{"current_steps": 278, "total_steps": 468, "loss": 0.4286, "lr": 1.69524105961553e-05, "epoch": 1.7763578274760383, "percentage": 59.4, "elapsed_time": "1:38:05", "remaining_time": "1:07:02"}
|
| 279 |
+
{"current_steps": 279, "total_steps": 468, "loss": 0.3742, "lr": 1.6804995375935674e-05, "epoch": 1.7827476038338657, "percentage": 59.62, "elapsed_time": "1:38:26", "remaining_time": "1:06:41"}
|
| 280 |
+
{"current_steps": 280, "total_steps": 468, "loss": 0.3685, "lr": 1.665775806762903e-05, "epoch": 1.7891373801916934, "percentage": 59.83, "elapsed_time": "1:38:48", "remaining_time": "1:06:20"}
|
| 281 |
+
{"current_steps": 281, "total_steps": 468, "loss": 0.408, "lr": 1.6510706870056455e-05, "epoch": 1.7955271565495208, "percentage": 60.04, "elapsed_time": "1:39:08", "remaining_time": "1:05:58"}
|
| 282 |
+
{"current_steps": 282, "total_steps": 468, "loss": 0.3659, "lr": 1.6363849971675524e-05, "epoch": 1.8019169329073481, "percentage": 60.26, "elapsed_time": "1:39:24", "remaining_time": "1:05:33"}
|
| 283 |
+
{"current_steps": 283, "total_steps": 468, "loss": 0.3686, "lr": 1.6217195550124397e-05, "epoch": 1.8083067092651757, "percentage": 60.47, "elapsed_time": "1:39:43", "remaining_time": "1:05:11"}
|
| 284 |
+
{"current_steps": 284, "total_steps": 468, "loss": 0.4467, "lr": 1.6070751771766434e-05, "epoch": 1.8146964856230032, "percentage": 60.68, "elapsed_time": "1:40:04", "remaining_time": "1:04:50"}
|
| 285 |
+
{"current_steps": 285, "total_steps": 468, "loss": 0.3776, "lr": 1.592452679123545e-05, "epoch": 1.8210862619808306, "percentage": 60.9, "elapsed_time": "1:40:23", "remaining_time": "1:04:27"}
|
| 286 |
+
{"current_steps": 286, "total_steps": 468, "loss": 0.4504, "lr": 1.577852875098164e-05, "epoch": 1.8274760383386581, "percentage": 61.11, "elapsed_time": "1:40:47", "remaining_time": "1:04:08"}
|
| 287 |
+
{"current_steps": 287, "total_steps": 468, "loss": 0.3501, "lr": 1.563276578081816e-05, "epoch": 1.8338658146964857, "percentage": 61.32, "elapsed_time": "1:41:09", "remaining_time": "1:03:47"}
|
| 288 |
+
{"current_steps": 288, "total_steps": 468, "loss": 0.4209, "lr": 1.5487245997468434e-05, "epoch": 1.840255591054313, "percentage": 61.54, "elapsed_time": "1:41:30", "remaining_time": "1:03:26"}
|
| 289 |
+
{"current_steps": 289, "total_steps": 468, "loss": 0.3647, "lr": 1.5341977504114176e-05, "epoch": 1.8466453674121406, "percentage": 61.75, "elapsed_time": "1:41:49", "remaining_time": "1:03:03"}
|
| 290 |
+
{"current_steps": 290, "total_steps": 468, "loss": 0.4069, "lr": 1.5196968389944153e-05, "epoch": 1.8530351437699681, "percentage": 61.97, "elapsed_time": "1:42:10", "remaining_time": "1:02:42"}
|
| 291 |
+
{"current_steps": 291, "total_steps": 468, "loss": 0.3763, "lr": 1.5052226729703782e-05, "epoch": 1.8594249201277955, "percentage": 62.18, "elapsed_time": "1:42:29", "remaining_time": "1:02:20"}
|
| 292 |
+
{"current_steps": 292, "total_steps": 468, "loss": 0.367, "lr": 1.4907760583245451e-05, "epoch": 1.865814696485623, "percentage": 62.39, "elapsed_time": "1:42:48", "remaining_time": "1:01:58"}
|
| 293 |
+
{"current_steps": 293, "total_steps": 468, "loss": 0.3964, "lr": 1.4763577995079738e-05, "epoch": 1.8722044728434506, "percentage": 62.61, "elapsed_time": "1:43:07", "remaining_time": "1:01:35"}
|
| 294 |
+
{"current_steps": 294, "total_steps": 468, "loss": 0.3378, "lr": 1.461968699392743e-05, "epoch": 1.878594249201278, "percentage": 62.82, "elapsed_time": "1:43:26", "remaining_time": "1:01:12"}
|
| 295 |
+
{"current_steps": 295, "total_steps": 468, "loss": 0.4326, "lr": 1.4476095592272494e-05, "epoch": 1.8849840255591053, "percentage": 63.03, "elapsed_time": "1:43:48", "remaining_time": "1:00:52"}
|
| 296 |
+
{"current_steps": 296, "total_steps": 468, "loss": 0.369, "lr": 1.4332811785915852e-05, "epoch": 1.891373801916933, "percentage": 63.25, "elapsed_time": "1:44:13", "remaining_time": "1:00:33"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 468, "loss": 0.3897, "lr": 1.418984355353019e-05, "epoch": 1.8977635782747604, "percentage": 63.46, "elapsed_time": "1:44:33", "remaining_time": "1:00:11"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 468, "loss": 0.4251, "lr": 1.404719885621563e-05, "epoch": 1.9041533546325877, "percentage": 63.68, "elapsed_time": "1:44:55", "remaining_time": "0:59:51"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 468, "loss": 0.3646, "lr": 1.390488563705644e-05, "epoch": 1.9105431309904153, "percentage": 63.89, "elapsed_time": "1:45:14", "remaining_time": "0:59:28"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 468, "loss": 0.4235, "lr": 1.3762911820678739e-05, "epoch": 1.9169329073482428, "percentage": 64.1, "elapsed_time": "1:45:35", "remaining_time": "0:59:08"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 468, "loss": 0.3794, "lr": 1.3621285312809193e-05, "epoch": 1.9233226837060702, "percentage": 64.32, "elapsed_time": "1:45:56", "remaining_time": "0:58:46"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 468, "loss": 0.4011, "lr": 1.3480013999834811e-05, "epoch": 1.9297124600638977, "percentage": 64.53, "elapsed_time": "1:46:17", "remaining_time": "0:58:25"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 468, "loss": 0.3981, "lr": 1.3339105748363776e-05, "epoch": 1.9361022364217253, "percentage": 64.74, "elapsed_time": "1:46:39", "remaining_time": "0:58:05"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 468, "loss": 0.3767, "lr": 1.3198568404787418e-05, "epoch": 1.9424920127795526, "percentage": 64.96, "elapsed_time": "1:47:00", "remaining_time": "0:57:43"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 468, "loss": 0.4415, "lr": 1.3058409794843288e-05, "epoch": 1.9488817891373802, "percentage": 65.17, "elapsed_time": "1:47:18", "remaining_time": "0:57:21"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 468, "loss": 0.3879, "lr": 1.2918637723179371e-05, "epoch": 1.9552715654952078, "percentage": 65.38, "elapsed_time": "1:47:42", "remaining_time": "0:57:01"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 468, "loss": 0.4269, "lr": 1.2779259972919512e-05, "epoch": 1.961661341853035, "percentage": 65.6, "elapsed_time": "1:48:06", "remaining_time": "0:56:41"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 468, "loss": 0.3205, "lr": 1.2640284305229989e-05, "epoch": 1.9680511182108626, "percentage": 65.81, "elapsed_time": "1:48:29", "remaining_time": "0:56:21"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 468, "loss": 0.395, "lr": 1.2501718458887369e-05, "epoch": 1.9744408945686902, "percentage": 66.03, "elapsed_time": "1:48:49", "remaining_time": "0:55:59"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 468, "loss": 0.3931, "lr": 1.2363570149847556e-05, "epoch": 1.9808306709265175, "percentage": 66.24, "elapsed_time": "1:49:13", "remaining_time": "0:55:40"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 468, "loss": 0.3755, "lr": 1.2225847070816148e-05, "epoch": 1.9872204472843449, "percentage": 66.45, "elapsed_time": "1:49:35", "remaining_time": "0:55:19"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 468, "loss": 0.4243, "lr": 1.208855689082005e-05, "epoch": 1.9936102236421727, "percentage": 66.67, "elapsed_time": "1:49:55", "remaining_time": "0:54:57"}
|
| 313 |
+
{"current_steps": 313, "total_steps": 468, "loss": 0.4858, "lr": 1.1951707254780465e-05, "epoch": 2.0, "percentage": 66.88, "elapsed_time": "1:50:11", "remaining_time": "0:54:34"}
|
| 314 |
+
{"current_steps": 314, "total_steps": 468, "loss": 0.2806, "lr": 1.1815305783087153e-05, "epoch": 2.0063897763578273, "percentage": 67.09, "elapsed_time": "1:51:19", "remaining_time": "0:54:35"}
|
| 315 |
+
{"current_steps": 315, "total_steps": 468, "loss": 0.295, "lr": 1.1679360071174121e-05, "epoch": 2.012779552715655, "percentage": 67.31, "elapsed_time": "1:51:37", "remaining_time": "0:54:12"}
|
| 316 |
+
{"current_steps": 316, "total_steps": 468, "loss": 0.2896, "lr": 1.1543877689096661e-05, "epoch": 2.0191693290734825, "percentage": 67.52, "elapsed_time": "1:52:00", "remaining_time": "0:53:52"}
|
| 317 |
+
{"current_steps": 317, "total_steps": 468, "loss": 0.2837, "lr": 1.1408866181109824e-05, "epoch": 2.02555910543131, "percentage": 67.74, "elapsed_time": "1:52:22", "remaining_time": "0:53:31"}
|
| 318 |
+
{"current_steps": 318, "total_steps": 468, "loss": 0.2856, "lr": 1.1274333065248327e-05, "epoch": 2.0319488817891376, "percentage": 67.95, "elapsed_time": "1:52:43", "remaining_time": "0:53:10"}
|
| 319 |
+
{"current_steps": 319, "total_steps": 468, "loss": 0.2885, "lr": 1.1140285832907888e-05, "epoch": 2.038338658146965, "percentage": 68.16, "elapsed_time": "1:53:04", "remaining_time": "0:52:49"}
|
| 320 |
+
{"current_steps": 320, "total_steps": 468, "loss": 0.3018, "lr": 1.1006731948428118e-05, "epoch": 2.0447284345047922, "percentage": 68.38, "elapsed_time": "1:53:27", "remaining_time": "0:52:28"}
|
| 321 |
+
{"current_steps": 321, "total_steps": 468, "loss": 0.2815, "lr": 1.0873678848676852e-05, "epoch": 2.0511182108626196, "percentage": 68.59, "elapsed_time": "1:53:48", "remaining_time": "0:52:07"}
|