Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:82e90cb4978a2f6c6fe2c414046729b4046411341280b581f5b82c682914537f
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dc344544a6fac01f23e495c94062de7f3510785ac1bd8dd66405904b2203e216
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23fbd71df21ec4d466453ba06e7e79c24ba17775c151cd4bb6bbabc17b937497
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e62ab16b98650c167fde9ef8bb591f1594cfc5eac2e08d45c48a63e1515156ab
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -220,3 +220,115 @@
|
|
| 220 |
{"current_steps": 220, "total_steps": 333, "loss": 0.4197, "lr": 2.503305686485991e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:07:59", "remaining_time": "10:51:17"}
|
| 221 |
{"current_steps": 221, "total_steps": 333, "loss": 0.4085, "lr": 2.464413991568222e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:13:28", "remaining_time": "10:45:22"}
|
| 222 |
{"current_steps": 222, "total_steps": 333, "loss": 0.4325, "lr": 2.4256918192173088e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:19:27", "remaining_time": "10:39:43"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 220 |
{"current_steps": 220, "total_steps": 333, "loss": 0.4197, "lr": 2.503305686485991e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:07:59", "remaining_time": "10:51:17"}
|
| 221 |
{"current_steps": 221, "total_steps": 333, "loss": 0.4085, "lr": 2.464413991568222e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:13:28", "remaining_time": "10:45:22"}
|
| 222 |
{"current_steps": 222, "total_steps": 333, "loss": 0.4325, "lr": 2.4256918192173088e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:19:27", "remaining_time": "10:39:43"}
|
| 223 |
+
{"current_steps": 223, "total_steps": 333, "loss": 0.7473, "lr": 2.3871434442065414e-05, "epoch": 2.0061763054463784, "percentage": 66.97, "elapsed_time": "21:25:55", "remaining_time": "10:34:18"}
|
| 224 |
+
{"current_steps": 224, "total_steps": 333, "loss": 0.3817, "lr": 2.3487731221226754e-05, "epoch": 2.0151600224592925, "percentage": 67.27, "elapsed_time": "21:31:36", "remaining_time": "10:28:30"}
|
| 225 |
+
{"current_steps": 225, "total_steps": 333, "loss": 0.4043, "lr": 2.3105850888961348e-05, "epoch": 2.0241437394722066, "percentage": 67.57, "elapsed_time": "21:37:38", "remaining_time": "10:22:52"}
|
| 226 |
+
{"current_steps": 226, "total_steps": 333, "loss": 0.3908, "lr": 2.272583560333379e-05, "epoch": 2.0331274564851207, "percentage": 67.87, "elapsed_time": "21:43:24", "remaining_time": "10:17:05"}
|
| 227 |
+
{"current_steps": 227, "total_steps": 333, "loss": 0.3963, "lr": 2.2347727316515e-05, "epoch": 2.042111173498035, "percentage": 68.17, "elapsed_time": "21:49:22", "remaining_time": "10:11:25"}
|
| 228 |
+
{"current_steps": 228, "total_steps": 333, "loss": 0.3875, "lr": 2.1971567770150814e-05, "epoch": 2.051094890510949, "percentage": 68.47, "elapsed_time": "21:55:12", "remaining_time": "10:05:41"}
|
| 229 |
+
{"current_steps": 229, "total_steps": 333, "loss": 0.4031, "lr": 2.1597398490753917e-05, "epoch": 2.060078607523863, "percentage": 68.77, "elapsed_time": "22:00:54", "remaining_time": "9:59:53"}
|
| 230 |
+
{"current_steps": 230, "total_steps": 333, "loss": 0.3891, "lr": 2.1225260785119456e-05, "epoch": 2.069062324536777, "percentage": 69.07, "elapsed_time": "22:06:39", "remaining_time": "9:54:06"}
|
| 231 |
+
{"current_steps": 231, "total_steps": 333, "loss": 0.3906, "lr": 2.0855195735764947e-05, "epoch": 2.0780460415496913, "percentage": 69.37, "elapsed_time": "22:12:40", "remaining_time": "9:48:27"}
|
| 232 |
+
{"current_steps": 232, "total_steps": 333, "loss": 0.3941, "lr": 2.0487244196394912e-05, "epoch": 2.0870297585626054, "percentage": 69.67, "elapsed_time": "22:18:27", "remaining_time": "9:42:41"}
|
| 233 |
+
{"current_steps": 233, "total_steps": 333, "loss": 0.3799, "lr": 2.0121446787390822e-05, "epoch": 2.0960134755755195, "percentage": 69.97, "elapsed_time": "22:24:21", "remaining_time": "9:36:58"}
|
| 234 |
+
{"current_steps": 234, "total_steps": 333, "loss": 0.3951, "lr": 1.9757843891326736e-05, "epoch": 2.1049971925884337, "percentage": 70.27, "elapsed_time": "22:29:49", "remaining_time": "9:31:04"}
|
| 235 |
+
{"current_steps": 235, "total_steps": 333, "loss": 0.3928, "lr": 1.939647564851127e-05, "epoch": 2.1139809096013478, "percentage": 70.57, "elapsed_time": "22:35:40", "remaining_time": "9:25:20"}
|
| 236 |
+
{"current_steps": 236, "total_steps": 333, "loss": 0.3891, "lr": 1.9037381952556217e-05, "epoch": 2.1229646266142614, "percentage": 70.87, "elapsed_time": "22:41:28", "remaining_time": "9:19:35"}
|
| 237 |
+
{"current_steps": 237, "total_steps": 333, "loss": 0.3967, "lr": 1.8680602445972463e-05, "epoch": 2.1319483436271756, "percentage": 71.17, "elapsed_time": "22:47:22", "remaining_time": "9:13:52"}
|
| 238 |
+
{"current_steps": 238, "total_steps": 333, "loss": 0.3859, "lr": 1.832617651579365e-05, "epoch": 2.1409320606400897, "percentage": 71.47, "elapsed_time": "22:53:06", "remaining_time": "9:08:05"}
|
| 239 |
+
{"current_steps": 239, "total_steps": 333, "loss": 0.3878, "lr": 1.797414328922797e-05, "epoch": 2.149915777653004, "percentage": 71.77, "elapsed_time": "22:58:48", "remaining_time": "9:02:17"}
|
| 240 |
+
{"current_steps": 240, "total_steps": 333, "loss": 0.3902, "lr": 1.7624541629338676e-05, "epoch": 2.158899494665918, "percentage": 72.07, "elapsed_time": "23:04:24", "remaining_time": "8:56:27"}
|
| 241 |
+
{"current_steps": 241, "total_steps": 333, "loss": 0.3803, "lr": 1.7277410130753775e-05, "epoch": 2.167883211678832, "percentage": 72.37, "elapsed_time": "23:10:14", "remaining_time": "8:50:42"}
|
| 242 |
+
{"current_steps": 242, "total_steps": 333, "loss": 0.4038, "lr": 1.6932787115405318e-05, "epoch": 2.176866928691746, "percentage": 72.67, "elapsed_time": "23:16:02", "remaining_time": "8:44:57"}
|
| 243 |
+
{"current_steps": 243, "total_steps": 333, "loss": 0.4097, "lr": 1.6590710628298826e-05, "epoch": 2.1858506457046603, "percentage": 72.97, "elapsed_time": "23:21:41", "remaining_time": "8:39:08"}
|
| 244 |
+
{"current_steps": 244, "total_steps": 333, "loss": 0.3841, "lr": 1.6251218433313254e-05, "epoch": 2.1948343627175744, "percentage": 73.27, "elapsed_time": "23:27:06", "remaining_time": "8:33:14"}
|
| 245 |
+
{"current_steps": 245, "total_steps": 333, "loss": 0.3879, "lr": 1.591434800903203e-05, "epoch": 2.2038180797304885, "percentage": 73.57, "elapsed_time": "23:32:45", "remaining_time": "8:27:26"}
|
| 246 |
+
{"current_steps": 246, "total_steps": 333, "loss": 0.3831, "lr": 1.558013654460555e-05, "epoch": 2.2128017967434026, "percentage": 73.87, "elapsed_time": "23:38:24", "remaining_time": "8:21:37"}
|
| 247 |
+
{"current_steps": 247, "total_steps": 333, "loss": 0.3932, "lr": 1.5248620935645666e-05, "epoch": 2.2217855137563167, "percentage": 74.17, "elapsed_time": "23:44:06", "remaining_time": "8:15:50"}
|
| 248 |
+
{"current_steps": 248, "total_steps": 333, "loss": 0.3793, "lr": 1.4919837780152544e-05, "epoch": 2.230769230769231, "percentage": 74.47, "elapsed_time": "23:49:39", "remaining_time": "8:10:00"}
|
| 249 |
+
{"current_steps": 249, "total_steps": 333, "loss": 0.3884, "lr": 1.4593823374474374e-05, "epoch": 2.239752947782145, "percentage": 74.77, "elapsed_time": "23:55:23", "remaining_time": "8:04:13"}
|
| 250 |
+
{"current_steps": 250, "total_steps": 333, "loss": 0.3883, "lr": 1.4270613709300429e-05, "epoch": 2.248736664795059, "percentage": 75.08, "elapsed_time": "1 day, 0:01:03", "remaining_time": "7:58:25"}
|
| 251 |
+
{"current_steps": 251, "total_steps": 333, "loss": 0.3925, "lr": 1.3950244465687833e-05, "epoch": 2.257720381807973, "percentage": 75.38, "elapsed_time": "1 day, 0:07:00", "remaining_time": "7:52:43"}
|
| 252 |
+
{"current_steps": 252, "total_steps": 333, "loss": 0.3988, "lr": 1.3632751011122497e-05, "epoch": 2.2667040988208873, "percentage": 75.68, "elapsed_time": "1 day, 0:13:01", "remaining_time": "7:47:02"}
|
| 253 |
+
{"current_steps": 253, "total_steps": 333, "loss": 0.3857, "lr": 1.3318168395614697e-05, "epoch": 2.2756878158338014, "percentage": 75.98, "elapsed_time": "1 day, 0:18:33", "remaining_time": "7:41:12"}
|
| 254 |
+
{"current_steps": 254, "total_steps": 333, "loss": 0.4054, "lr": 1.3006531347829699e-05, "epoch": 2.2846715328467155, "percentage": 76.28, "elapsed_time": "1 day, 0:24:26", "remaining_time": "7:35:28"}
|
| 255 |
+
{"current_steps": 255, "total_steps": 333, "loss": 0.389, "lr": 1.2697874271253844e-05, "epoch": 2.293655249859629, "percentage": 76.58, "elapsed_time": "1 day, 0:30:23", "remaining_time": "7:29:45"}
|
| 256 |
+
{"current_steps": 256, "total_steps": 333, "loss": 0.398, "lr": 1.2392231240396542e-05, "epoch": 2.3026389668725433, "percentage": 76.88, "elapsed_time": "1 day, 0:35:58", "remaining_time": "7:23:56"}
|
| 257 |
+
{"current_steps": 257, "total_steps": 333, "loss": 0.3964, "lr": 1.2089635997028592e-05, "epoch": 2.3116226838854574, "percentage": 77.18, "elapsed_time": "1 day, 0:41:49", "remaining_time": "7:18:12"}
|
| 258 |
+
{"current_steps": 258, "total_steps": 333, "loss": 0.3827, "lr": 1.1790121946457212e-05, "epoch": 2.3206064008983716, "percentage": 77.48, "elapsed_time": "1 day, 0:47:40", "remaining_time": "7:12:27"}
|
| 259 |
+
{"current_steps": 259, "total_steps": 333, "loss": 0.403, "lr": 1.1493722153838239e-05, "epoch": 2.3295901179112857, "percentage": 77.78, "elapsed_time": "1 day, 0:53:30", "remaining_time": "7:06:42"}
|
| 260 |
+
{"current_steps": 260, "total_steps": 333, "loss": 0.3774, "lr": 1.120046934052585e-05, "epoch": 2.3385738349242, "percentage": 78.08, "elapsed_time": "1 day, 0:59:03", "remaining_time": "7:00:53"}
|
| 261 |
+
{"current_steps": 261, "total_steps": 333, "loss": 0.3994, "lr": 1.0910395880460274e-05, "epoch": 2.347557551937114, "percentage": 78.38, "elapsed_time": "1 day, 1:04:35", "remaining_time": "6:55:03"}
|
| 262 |
+
{"current_steps": 262, "total_steps": 333, "loss": 0.3959, "lr": 1.062353379659383e-05, "epoch": 2.356541268950028, "percentage": 78.68, "elapsed_time": "1 day, 1:10:12", "remaining_time": "6:49:15"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 333, "loss": 0.3909, "lr": 1.0339914757355718e-05, "epoch": 2.365524985962942, "percentage": 78.98, "elapsed_time": "1 day, 1:16:05", "remaining_time": "6:43:31"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 333, "loss": 0.3964, "lr": 1.0059570073155953e-05, "epoch": 2.3745087029758563, "percentage": 79.28, "elapsed_time": "1 day, 1:21:45", "remaining_time": "6:37:43"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 333, "loss": 0.3962, "lr": 9.782530692928832e-06, "epoch": 2.3834924199887704, "percentage": 79.58, "elapsed_time": "1 day, 1:27:35", "remaining_time": "6:31:59"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 333, "loss": 0.3987, "lr": 9.508827200716273e-06, "epoch": 2.3924761370016845, "percentage": 79.88, "elapsed_time": "1 day, 1:33:24", "remaining_time": "6:26:14"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 333, "loss": 0.3851, "lr": 9.238489812291469e-06, "epoch": 2.4014598540145986, "percentage": 80.18, "elapsed_time": "1 day, 1:39:13", "remaining_time": "6:20:29"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 333, "loss": 0.3972, "lr": 8.971548371823205e-06, "epoch": 2.4104435710275127, "percentage": 80.48, "elapsed_time": "1 day, 1:45:12", "remaining_time": "6:14:46"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 333, "loss": 0.401, "lr": 8.708032348581144e-06, "epoch": 2.419427288040427, "percentage": 80.78, "elapsed_time": "1 day, 1:50:55", "remaining_time": "6:08:59"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 333, "loss": 0.3801, "lr": 8.447970833682584e-06, "epoch": 2.428411005053341, "percentage": 81.08, "elapsed_time": "1 day, 1:56:36", "remaining_time": "6:03:12"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 333, "loss": 0.3835, "lr": 8.191392536880852e-06, "epoch": 2.437394722066255, "percentage": 81.38, "elapsed_time": "1 day, 2:02:37", "remaining_time": "5:57:30"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 333, "loss": 0.3924, "lr": 7.938325783395924e-06, "epoch": 2.446378439079169, "percentage": 81.68, "elapsed_time": "1 day, 2:08:35", "remaining_time": "5:51:46"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 333, "loss": 0.3839, "lr": 7.68879851078741e-06, "epoch": 2.4553621560920833, "percentage": 81.98, "elapsed_time": "1 day, 2:14:07", "remaining_time": "5:45:57"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 333, "loss": 0.4029, "lr": 7.442838265870347e-06, "epoch": 2.464345873104997, "percentage": 82.28, "elapsed_time": "1 day, 2:19:51", "remaining_time": "5:40:11"}
|
| 275 |
+
{"current_steps": 275, "total_steps": 333, "loss": 0.3933, "lr": 7.2004722016741605e-06, "epoch": 2.473329590117911, "percentage": 82.58, "elapsed_time": "1 day, 2:25:28", "remaining_time": "5:34:23"}
|
| 276 |
+
{"current_steps": 276, "total_steps": 333, "loss": 0.3984, "lr": 6.961727074445055e-06, "epoch": 2.482313307130825, "percentage": 82.88, "elapsed_time": "1 day, 2:31:28", "remaining_time": "5:28:40"}
|
| 277 |
+
{"current_steps": 277, "total_steps": 333, "loss": 0.378, "lr": 6.726629240692255e-06, "epoch": 2.4912970241437393, "percentage": 83.18, "elapsed_time": "1 day, 2:37:15", "remaining_time": "5:22:54"}
|
| 278 |
+
{"current_steps": 278, "total_steps": 333, "loss": 0.3794, "lr": 6.4952046542783395e-06, "epoch": 2.5002807411566534, "percentage": 83.48, "elapsed_time": "1 day, 2:42:42", "remaining_time": "5:17:04"}
|
| 279 |
+
{"current_steps": 279, "total_steps": 333, "loss": 0.3905, "lr": 6.2674788635540415e-06, "epoch": 2.5092644581695676, "percentage": 83.78, "elapsed_time": "1 day, 2:48:16", "remaining_time": "5:11:16"}
|
| 280 |
+
{"current_steps": 280, "total_steps": 333, "loss": 0.4005, "lr": 6.04347700853781e-06, "epoch": 2.5182481751824817, "percentage": 84.08, "elapsed_time": "1 day, 2:54:00", "remaining_time": "5:05:30"}
|
| 281 |
+
{"current_steps": 281, "total_steps": 333, "loss": 0.3826, "lr": 5.823223818140458e-06, "epoch": 2.527231892195396, "percentage": 84.38, "elapsed_time": "1 day, 2:59:42", "remaining_time": "4:59:43"}
|
| 282 |
+
{"current_steps": 282, "total_steps": 333, "loss": 0.3862, "lr": 5.606743607435183e-06, "epoch": 2.53621560920831, "percentage": 84.68, "elapsed_time": "1 day, 3:05:30", "remaining_time": "4:53:58"}
|
| 283 |
+
{"current_steps": 283, "total_steps": 333, "loss": 0.4022, "lr": 5.394060274973267e-06, "epoch": 2.545199326221224, "percentage": 84.98, "elapsed_time": "1 day, 3:11:11", "remaining_time": "4:48:11"}
|
| 284 |
+
{"current_steps": 284, "total_steps": 333, "loss": 0.3772, "lr": 5.185197300145817e-06, "epoch": 2.554183043234138, "percentage": 85.29, "elapsed_time": "1 day, 3:16:47", "remaining_time": "4:42:24"}
|
| 285 |
+
{"current_steps": 285, "total_steps": 333, "loss": 0.4074, "lr": 4.980177740591678e-06, "epoch": 2.5631667602470523, "percentage": 85.59, "elapsed_time": "1 day, 3:22:25", "remaining_time": "4:36:37"}
|
| 286 |
+
{"current_steps": 286, "total_steps": 333, "loss": 0.3946, "lr": 4.779024229652005e-06, "epoch": 2.5721504772599664, "percentage": 85.89, "elapsed_time": "1 day, 3:28:08", "remaining_time": "4:30:50"}
|
| 287 |
+
{"current_steps": 287, "total_steps": 333, "loss": 0.3948, "lr": 4.581758973871609e-06, "epoch": 2.5811341942728805, "percentage": 86.19, "elapsed_time": "1 day, 3:33:45", "remaining_time": "4:25:03"}
|
| 288 |
+
{"current_steps": 288, "total_steps": 333, "loss": 0.3834, "lr": 4.3884037505474455e-06, "epoch": 2.5901179112857946, "percentage": 86.49, "elapsed_time": "1 day, 3:39:33", "remaining_time": "4:19:18"}
|
| 289 |
+
{"current_steps": 289, "total_steps": 333, "loss": 0.3839, "lr": 4.198979905324496e-06, "epoch": 2.5991016282987087, "percentage": 86.79, "elapsed_time": "1 day, 3:45:13", "remaining_time": "4:13:31"}
|
| 290 |
+
{"current_steps": 290, "total_steps": 333, "loss": 0.4005, "lr": 4.0135083498392905e-06, "epoch": 2.608085345311623, "percentage": 87.09, "elapsed_time": "1 day, 3:51:11", "remaining_time": "4:07:47"}
|
| 291 |
+
{"current_steps": 291, "total_steps": 333, "loss": 0.3946, "lr": 3.832009559411338e-06, "epoch": 2.6170690623245365, "percentage": 87.39, "elapsed_time": "1 day, 3:56:49", "remaining_time": "4:02:00"}
|
| 292 |
+
{"current_steps": 292, "total_steps": 333, "loss": 0.3797, "lr": 3.654503570782755e-06, "epoch": 2.626052779337451, "percentage": 87.69, "elapsed_time": "1 day, 4:02:49", "remaining_time": "3:56:17"}
|
| 293 |
+
{"current_steps": 293, "total_steps": 333, "loss": 0.3977, "lr": 3.481009979906258e-06, "epoch": 2.6350364963503647, "percentage": 87.99, "elapsed_time": "1 day, 4:08:39", "remaining_time": "3:50:31"}
|
| 294 |
+
{"current_steps": 294, "total_steps": 333, "loss": 0.3944, "lr": 3.311547939781887e-06, "epoch": 2.6440202133632793, "percentage": 88.29, "elapsed_time": "1 day, 4:14:19", "remaining_time": "3:44:45"}
|
| 295 |
+
{"current_steps": 295, "total_steps": 333, "loss": 0.3851, "lr": 3.14613615834253e-06, "epoch": 2.653003930376193, "percentage": 88.59, "elapsed_time": "1 day, 4:20:08", "remaining_time": "3:39:00"}
|
| 296 |
+
{"current_steps": 296, "total_steps": 333, "loss": 0.3955, "lr": 2.9847928963887198e-06, "epoch": 2.661987647389107, "percentage": 88.89, "elapsed_time": "1 day, 4:25:58", "remaining_time": "3:33:14"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 333, "loss": 0.3918, "lr": 2.8275359655726586e-06, "epoch": 2.670971364402021, "percentage": 89.19, "elapsed_time": "1 day, 4:31:47", "remaining_time": "3:27:29"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 333, "loss": 0.3916, "lr": 2.6743827264319012e-06, "epoch": 2.6799550814149353, "percentage": 89.49, "elapsed_time": "1 day, 4:37:41", "remaining_time": "3:21:44"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 333, "loss": 0.3846, "lr": 2.5253500864728155e-06, "epoch": 2.6889387984278494, "percentage": 89.79, "elapsed_time": "1 day, 4:43:31", "remaining_time": "3:15:59"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 333, "loss": 0.3824, "lr": 2.3804544983040724e-06, "epoch": 2.6979225154407636, "percentage": 90.09, "elapsed_time": "1 day, 4:49:17", "remaining_time": "3:10:13"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 333, "loss": 0.3927, "lr": 2.23971195782033e-06, "epoch": 2.7069062324536777, "percentage": 90.39, "elapsed_time": "1 day, 4:55:03", "remaining_time": "3:04:27"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 333, "loss": 0.3993, "lr": 2.1031380024363645e-06, "epoch": 2.715889949466592, "percentage": 90.69, "elapsed_time": "1 day, 5:01:01", "remaining_time": "2:58:42"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 333, "loss": 0.386, "lr": 1.9707477093717786e-06, "epoch": 2.724873666479506, "percentage": 90.99, "elapsed_time": "1 day, 5:06:46", "remaining_time": "2:52:56"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 333, "loss": 0.3816, "lr": 1.8425556939865696e-06, "epoch": 2.73385738349242, "percentage": 91.29, "elapsed_time": "1 day, 5:12:21", "remaining_time": "2:47:09"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 333, "loss": 0.3914, "lr": 1.7185761081676222e-06, "epoch": 2.742841100505334, "percentage": 91.59, "elapsed_time": "1 day, 5:17:43", "remaining_time": "2:41:21"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 333, "loss": 0.3826, "lr": 1.5988226387664151e-06, "epoch": 2.7518248175182483, "percentage": 91.89, "elapsed_time": "1 day, 5:23:33", "remaining_time": "2:35:36"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 333, "loss": 0.3933, "lr": 1.4833085060880349e-06, "epoch": 2.7608085345311624, "percentage": 92.19, "elapsed_time": "1 day, 5:29:13", "remaining_time": "2:29:50"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 333, "loss": 0.3754, "lr": 1.3720464624317108e-06, "epoch": 2.7697922515440765, "percentage": 92.49, "elapsed_time": "1 day, 5:34:49", "remaining_time": "2:24:03"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 333, "loss": 0.4084, "lr": 1.2650487906830234e-06, "epoch": 2.7787759685569906, "percentage": 92.79, "elapsed_time": "1 day, 5:40:44", "remaining_time": "2:18:18"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 333, "loss": 0.3757, "lr": 1.1623273029579195e-06, "epoch": 2.7877596855699043, "percentage": 93.09, "elapsed_time": "1 day, 5:46:10", "remaining_time": "2:12:31"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 333, "loss": 0.3957, "lr": 1.063893339298674e-06, "epoch": 2.796743402582819, "percentage": 93.39, "elapsed_time": "1 day, 5:51:52", "remaining_time": "2:06:45"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 333, "loss": 0.3943, "lr": 9.697577664220303e-07, "epoch": 2.8057271195957325, "percentage": 93.69, "elapsed_time": "1 day, 5:57:30", "remaining_time": "2:00:59"}
|
| 313 |
+
{"current_steps": 313, "total_steps": 333, "loss": 0.3865, "lr": 8.799309765195452e-07, "epoch": 2.814710836608647, "percentage": 93.99, "elapsed_time": "1 day, 6:03:31", "remaining_time": "1:55:14"}
|
| 314 |
+
{"current_steps": 314, "total_steps": 333, "loss": 0.393, "lr": 7.944228861103264e-07, "epoch": 2.8236945536215607, "percentage": 94.29, "elapsed_time": "1 day, 6:09:30", "remaining_time": "1:49:29"}
|
| 315 |
+
{"current_steps": 315, "total_steps": 333, "loss": 0.387, "lr": 7.132429349463011e-07, "epoch": 2.832678270634475, "percentage": 94.59, "elapsed_time": "1 day, 6:15:14", "remaining_time": "1:43:43"}
|
| 316 |
+
{"current_steps": 316, "total_steps": 333, "loss": 0.391, "lr": 6.364000849700791e-07, "epoch": 2.841661987647389, "percentage": 94.89, "elapsed_time": "1 day, 6:21:11", "remaining_time": "1:37:58"}
|
| 317 |
+
{"current_steps": 317, "total_steps": 333, "loss": 0.3974, "lr": 5.639028193256257e-07, "epoch": 2.850645704660303, "percentage": 95.2, "elapsed_time": "1 day, 6:26:58", "remaining_time": "1:32:12"}
|
| 318 |
+
{"current_steps": 318, "total_steps": 333, "loss": 0.3912, "lr": 4.957591414217344e-07, "epoch": 2.859629421673217, "percentage": 95.5, "elapsed_time": "1 day, 6:32:52", "remaining_time": "1:26:27"}
|
| 319 |
+
{"current_steps": 319, "total_steps": 333, "loss": 0.3871, "lr": 4.3197657404848935e-07, "epoch": 2.8686131386861313, "percentage": 95.8, "elapsed_time": "1 day, 6:38:34", "remaining_time": "1:20:41"}
|
| 320 |
+
{"current_steps": 320, "total_steps": 333, "loss": 0.3955, "lr": 3.725621585467698e-07, "epoch": 2.8775968556990454, "percentage": 96.1, "elapsed_time": "1 day, 6:44:33", "remaining_time": "1:14:56"}
|
| 321 |
+
{"current_steps": 321, "total_steps": 333, "loss": 0.3889, "lr": 3.1752245403092963e-07, "epoch": 2.8865805727119596, "percentage": 96.4, "elapsed_time": "1 day, 6:50:37", "remaining_time": "1:09:10"}
|
| 322 |
+
{"current_steps": 322, "total_steps": 333, "loss": 0.3876, "lr": 2.6686353666468323e-07, "epoch": 2.8955642897248737, "percentage": 96.7, "elapsed_time": "1 day, 6:56:13", "remaining_time": "1:03:24"}
|
| 323 |
+
{"current_steps": 323, "total_steps": 333, "loss": 0.3928, "lr": 2.2059099899033098e-07, "epoch": 2.904548006737788, "percentage": 97.0, "elapsed_time": "1 day, 7:01:56", "remaining_time": "0:57:38"}
|
| 324 |
+
{"current_steps": 324, "total_steps": 333, "loss": 0.3856, "lr": 1.7870994931135977e-07, "epoch": 2.913531723750702, "percentage": 97.3, "elapsed_time": "1 day, 7:07:41", "remaining_time": "0:51:52"}
|
| 325 |
+
{"current_steps": 325, "total_steps": 333, "loss": 0.3976, "lr": 1.412250111285074e-07, "epoch": 2.922515440763616, "percentage": 97.6, "elapsed_time": "1 day, 7:13:20", "remaining_time": "0:46:06"}
|
| 326 |
+
{"current_steps": 326, "total_steps": 333, "loss": 0.3809, "lr": 1.0814032262935315e-07, "epoch": 2.93149915777653, "percentage": 97.9, "elapsed_time": "1 day, 7:19:11", "remaining_time": "0:40:21"}
|
| 327 |
+
{"current_steps": 327, "total_steps": 333, "loss": 0.3791, "lr": 7.945953623146096e-08, "epoch": 2.9404828747894443, "percentage": 98.2, "elapsed_time": "1 day, 7:25:05", "remaining_time": "0:34:35"}
|
| 328 |
+
{"current_steps": 328, "total_steps": 333, "loss": 0.3928, "lr": 5.518581817918645e-08, "epoch": 2.9494665918023584, "percentage": 98.5, "elapsed_time": "1 day, 7:30:52", "remaining_time": "0:28:49"}
|
| 329 |
+
{"current_steps": 329, "total_steps": 333, "loss": 0.3875, "lr": 3.532184819412532e-08, "epoch": 2.958450308815272, "percentage": 98.8, "elapsed_time": "1 day, 7:36:42", "remaining_time": "0:23:03"}
|
| 330 |
+
{"current_steps": 330, "total_steps": 333, "loss": 0.3902, "lr": 1.9869819179292315e-08, "epoch": 2.9674340258281866, "percentage": 99.1, "elapsed_time": "1 day, 7:42:17", "remaining_time": "0:17:17"}
|
| 331 |
+
{"current_steps": 331, "total_steps": 333, "loss": 0.3928, "lr": 8.83143697702149e-09, "epoch": 2.9764177428411003, "percentage": 99.4, "elapsed_time": "1 day, 7:48:24", "remaining_time": "0:11:31"}
|
| 332 |
+
{"current_steps": 332, "total_steps": 333, "loss": 0.3867, "lr": 2.2079201806501916e-09, "epoch": 2.985401459854015, "percentage": 99.7, "elapsed_time": "1 day, 7:54:11", "remaining_time": "0:05:45"}
|
| 333 |
+
{"current_steps": 333, "total_steps": 333, "loss": 0.3902, "lr": 0.0, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 8:00:05", "remaining_time": "0:00:00"}
|
| 334 |
+
{"current_steps": 333, "total_steps": 333, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 8:01:39", "remaining_time": "0:00:00"}
|