Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0a5759541c4c435b10f900c6ac234a6feccb5bf141f6c5934a1471cd125a0050
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b47eedfef1a2f38d93761795a11caeeb3de29452f8f3a55b95b2af8075f7ac6a
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bae0c59c8d9bd7898b656efcb69e6ef76cb2e71d86374b2b3fd46019adc634cb
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:75b7b6e0328d25a69ba1f60c0e2c3612e6f61edcc1bc2e27fbcbd47e9e6acf8f
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -220,3 +220,115 @@
|
|
| 220 |
{"current_steps": 220, "total_steps": 333, "loss": 0.4098, "lr": 3.540208696455256e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:06:35", "remaining_time": "10:50:33"}
|
| 221 |
{"current_steps": 221, "total_steps": 333, "loss": 0.3992, "lr": 3.485207536464666e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:12:03", "remaining_time": "10:44:39"}
|
| 222 |
{"current_steps": 222, "total_steps": 333, "loss": 0.4227, "lr": 3.4304461175766773e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:18:02", "remaining_time": "10:39:01"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 220 |
{"current_steps": 220, "total_steps": 333, "loss": 0.4098, "lr": 3.540208696455256e-05, "epoch": 1.9778214486243684, "percentage": 66.07, "elapsed_time": "21:06:35", "remaining_time": "10:50:33"}
|
| 221 |
{"current_steps": 221, "total_steps": 333, "loss": 0.3992, "lr": 3.485207536464666e-05, "epoch": 1.9868051656372825, "percentage": 66.37, "elapsed_time": "21:12:03", "remaining_time": "10:44:39"}
|
| 222 |
{"current_steps": 222, "total_steps": 333, "loss": 0.4227, "lr": 3.4304461175766773e-05, "epoch": 1.9957888826501966, "percentage": 66.67, "elapsed_time": "21:18:02", "remaining_time": "10:39:01"}
|
| 223 |
+
{"current_steps": 223, "total_steps": 333, "loss": 0.7234, "lr": 3.3759304852333874e-05, "epoch": 2.0061763054463784, "percentage": 66.97, "elapsed_time": "21:24:30", "remaining_time": "10:33:36"}
|
| 224 |
+
{"current_steps": 224, "total_steps": 333, "loss": 0.364, "lr": 3.321666657743036e-05, "epoch": 2.0151600224592925, "percentage": 67.27, "elapsed_time": "21:30:10", "remaining_time": "10:27:48"}
|
| 225 |
+
{"current_steps": 225, "total_steps": 333, "loss": 0.3852, "lr": 3.2676606256156134e-05, "epoch": 2.0241437394722066, "percentage": 67.57, "elapsed_time": "21:36:12", "remaining_time": "10:22:10"}
|
| 226 |
+
{"current_steps": 226, "total_steps": 333, "loss": 0.3734, "lr": 3.213918350901529e-05, "epoch": 2.0331274564851207, "percentage": 67.87, "elapsed_time": "21:41:58", "remaining_time": "10:16:25"}
|
| 227 |
+
{"current_steps": 227, "total_steps": 333, "loss": 0.3779, "lr": 3.1604457665334285e-05, "epoch": 2.042111173498035, "percentage": 68.17, "elapsed_time": "21:47:56", "remaining_time": "10:10:45"}
|
| 228 |
+
{"current_steps": 228, "total_steps": 333, "loss": 0.3698, "lr": 3.107248775671218e-05, "epoch": 2.051094890510949, "percentage": 68.47, "elapsed_time": "21:53:46", "remaining_time": "10:05:01"}
|
| 229 |
+
{"current_steps": 229, "total_steps": 333, "loss": 0.3847, "lr": 3.054333251050381e-05, "epoch": 2.060078607523863, "percentage": 68.77, "elapsed_time": "21:59:27", "remaining_time": "9:59:13"}
|
| 230 |
+
{"current_steps": 230, "total_steps": 333, "loss": 0.3708, "lr": 3.0017050343336532e-05, "epoch": 2.069062324536777, "percentage": 69.07, "elapsed_time": "22:05:12", "remaining_time": "9:53:27"}
|
| 231 |
+
{"current_steps": 231, "total_steps": 333, "loss": 0.3722, "lr": 2.949369935466122e-05, "epoch": 2.0780460415496913, "percentage": 69.37, "elapsed_time": "22:11:13", "remaining_time": "9:47:48"}
|
| 232 |
+
{"current_steps": 232, "total_steps": 333, "loss": 0.375, "lr": 2.8973337320338337e-05, "epoch": 2.0870297585626054, "percentage": 69.67, "elapsed_time": "22:17:00", "remaining_time": "9:42:03"}
|
| 233 |
+
{"current_steps": 233, "total_steps": 333, "loss": 0.3613, "lr": 2.845602168625973e-05, "epoch": 2.0960134755755195, "percentage": 69.97, "elapsed_time": "22:22:53", "remaining_time": "9:36:20"}
|
| 234 |
+
{"current_steps": 234, "total_steps": 333, "loss": 0.376, "lr": 2.7941809562006803e-05, "epoch": 2.1049971925884337, "percentage": 70.27, "elapsed_time": "22:28:20", "remaining_time": "9:30:27"}
|
| 235 |
+
{"current_steps": 235, "total_steps": 333, "loss": 0.3741, "lr": 2.743075771454589e-05, "epoch": 2.1139809096013478, "percentage": 70.57, "elapsed_time": "22:34:11", "remaining_time": "9:24:43"}
|
| 236 |
+
{"current_steps": 236, "total_steps": 333, "loss": 0.3702, "lr": 2.6922922561961362e-05, "epoch": 2.1229646266142614, "percentage": 70.87, "elapsed_time": "22:39:59", "remaining_time": "9:18:58"}
|
| 237 |
+
{"current_steps": 237, "total_steps": 333, "loss": 0.3776, "lr": 2.6418360167227277e-05, "epoch": 2.1319483436271756, "percentage": 71.17, "elapsed_time": "22:45:53", "remaining_time": "9:13:16"}
|
| 238 |
+
{"current_steps": 238, "total_steps": 333, "loss": 0.3675, "lr": 2.5917126232018344e-05, "epoch": 2.1409320606400897, "percentage": 71.47, "elapsed_time": "22:51:37", "remaining_time": "9:07:29"}
|
| 239 |
+
{"current_steps": 239, "total_steps": 333, "loss": 0.3694, "lr": 2.54192760905606e-05, "epoch": 2.149915777653004, "percentage": 71.77, "elapsed_time": "22:57:19", "remaining_time": "9:01:42"}
|
| 240 |
+
{"current_steps": 240, "total_steps": 333, "loss": 0.3717, "lr": 2.4924864703522748e-05, "epoch": 2.158899494665918, "percentage": 72.07, "elapsed_time": "23:02:54", "remaining_time": "8:55:52"}
|
| 241 |
+
{"current_steps": 241, "total_steps": 333, "loss": 0.3619, "lr": 2.443394665194875e-05, "epoch": 2.167883211678832, "percentage": 72.37, "elapsed_time": "23:08:43", "remaining_time": "8:50:08"}
|
| 242 |
+
{"current_steps": 242, "total_steps": 333, "loss": 0.3842, "lr": 2.3946576131232258e-05, "epoch": 2.176866928691746, "percentage": 72.67, "elapsed_time": "23:14:30", "remaining_time": "8:44:23"}
|
| 243 |
+
{"current_steps": 243, "total_steps": 333, "loss": 0.3897, "lr": 2.3462806945133682e-05, "epoch": 2.1858506457046603, "percentage": 72.97, "elapsed_time": "23:20:09", "remaining_time": "8:38:34"}
|
| 244 |
+
{"current_steps": 244, "total_steps": 333, "loss": 0.3652, "lr": 2.2982692499840452e-05, "epoch": 2.1948343627175744, "percentage": 73.27, "elapsed_time": "23:25:33", "remaining_time": "8:32:40"}
|
| 245 |
+
{"current_steps": 245, "total_steps": 333, "loss": 0.369, "lr": 2.2506285798071218e-05, "epoch": 2.2038180797304885, "percentage": 73.57, "elapsed_time": "23:31:11", "remaining_time": "8:26:52"}
|
| 246 |
+
{"current_steps": 246, "total_steps": 333, "loss": 0.3639, "lr": 2.203363943322452e-05, "epoch": 2.2128017967434026, "percentage": 73.87, "elapsed_time": "23:36:50", "remaining_time": "8:21:04"}
|
| 247 |
+
{"current_steps": 247, "total_steps": 333, "loss": 0.3742, "lr": 2.1564805583572732e-05, "epoch": 2.2217855137563167, "percentage": 74.17, "elapsed_time": "23:42:32", "remaining_time": "8:15:17"}
|
| 248 |
+
{"current_steps": 248, "total_steps": 333, "loss": 0.3607, "lr": 2.109983600650176e-05, "epoch": 2.230769230769231, "percentage": 74.47, "elapsed_time": "23:48:05", "remaining_time": "8:09:28"}
|
| 249 |
+
{"current_steps": 249, "total_steps": 333, "loss": 0.3693, "lr": 2.0638782032797214e-05, "epoch": 2.239752947782145, "percentage": 74.77, "elapsed_time": "23:53:49", "remaining_time": "8:03:41"}
|
| 250 |
+
{"current_steps": 250, "total_steps": 333, "loss": 0.369, "lr": 2.018169456097774e-05, "epoch": 2.248736664795059, "percentage": 75.08, "elapsed_time": "23:59:28", "remaining_time": "7:57:54"}
|
| 251 |
+
{"current_steps": 251, "total_steps": 333, "loss": 0.3738, "lr": 1.9728624051676018e-05, "epoch": 2.257720381807973, "percentage": 75.38, "elapsed_time": "1 day, 0:05:23", "remaining_time": "7:52:12"}
|
| 252 |
+
{"current_steps": 252, "total_steps": 333, "loss": 0.3798, "lr": 1.927962052206808e-05, "epoch": 2.2667040988208873, "percentage": 75.68, "elapsed_time": "1 day, 0:11:24", "remaining_time": "7:46:31"}
|
| 253 |
+
{"current_steps": 253, "total_steps": 333, "loss": 0.3666, "lr": 1.8834733540351643e-05, "epoch": 2.2756878158338014, "percentage": 75.98, "elapsed_time": "1 day, 0:16:56", "remaining_time": "7:40:41"}
|
| 254 |
+
{"current_steps": 254, "total_steps": 333, "loss": 0.3853, "lr": 1.8394012220273954e-05, "epoch": 2.2846715328467155, "percentage": 76.28, "elapsed_time": "1 day, 0:22:49", "remaining_time": "7:34:58"}
|
| 255 |
+
{"current_steps": 255, "total_steps": 333, "loss": 0.3701, "lr": 1.7957505215709848e-05, "epoch": 2.293655249859629, "percentage": 76.58, "elapsed_time": "1 day, 0:28:45", "remaining_time": "7:29:16"}
|
| 256 |
+
{"current_steps": 256, "total_steps": 333, "loss": 0.3786, "lr": 1.7525260715290535e-05, "epoch": 2.3026389668725433, "percentage": 76.88, "elapsed_time": "1 day, 0:34:20", "remaining_time": "7:23:27"}
|
| 257 |
+
{"current_steps": 257, "total_steps": 333, "loss": 0.3772, "lr": 1.7097326437083794e-05, "epoch": 2.3116226838854574, "percentage": 77.18, "elapsed_time": "1 day, 0:40:11", "remaining_time": "7:17:43"}
|
| 258 |
+
{"current_steps": 258, "total_steps": 333, "loss": 0.3641, "lr": 1.6673749623326064e-05, "epoch": 2.3206064008983716, "percentage": 77.48, "elapsed_time": "1 day, 0:46:02", "remaining_time": "7:11:59"}
|
| 259 |
+
{"current_steps": 259, "total_steps": 333, "loss": 0.3832, "lr": 1.6254577035207113e-05, "epoch": 2.3295901179112857, "percentage": 77.78, "elapsed_time": "1 day, 0:51:52", "remaining_time": "7:06:15"}
|
| 260 |
+
{"current_steps": 260, "total_steps": 333, "loss": 0.3587, "lr": 1.5839854947707754e-05, "epoch": 2.3385738349242, "percentage": 78.08, "elapsed_time": "1 day, 0:57:25", "remaining_time": "7:00:25"}
|
| 261 |
+
{"current_steps": 261, "total_steps": 333, "loss": 0.3791, "lr": 1.5429629144491303e-05, "epoch": 2.347557551937114, "percentage": 78.38, "elapsed_time": "1 day, 1:02:56", "remaining_time": "6:54:36"}
|
| 262 |
+
{"current_steps": 262, "total_steps": 333, "loss": 0.3761, "lr": 1.5023944912849248e-05, "epoch": 2.356541268950028, "percentage": 78.68, "elapsed_time": "1 day, 1:08:33", "remaining_time": "6:48:48"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 333, "loss": 0.3717, "lr": 1.462284703870168e-05, "epoch": 2.365524985962942, "percentage": 78.98, "elapsed_time": "1 day, 1:14:26", "remaining_time": "6:43:04"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 333, "loss": 0.3757, "lr": 1.4226379801653136e-05, "epoch": 2.3745087029758563, "percentage": 79.28, "elapsed_time": "1 day, 1:20:05", "remaining_time": "6:37:17"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 333, "loss": 0.3765, "lr": 1.3834586970104307e-05, "epoch": 2.3834924199887704, "percentage": 79.58, "elapsed_time": "1 day, 1:25:56", "remaining_time": "6:31:33"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 333, "loss": 0.3795, "lr": 1.3447511796420162e-05, "epoch": 2.3924761370016845, "percentage": 79.88, "elapsed_time": "1 day, 1:31:44", "remaining_time": "6:25:48"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 333, "loss": 0.3659, "lr": 1.306519701215506e-05, "epoch": 2.4014598540145986, "percentage": 80.18, "elapsed_time": "1 day, 1:37:33", "remaining_time": "6:20:04"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 333, "loss": 0.3778, "lr": 1.2687684823335395e-05, "epoch": 2.4104435710275127, "percentage": 80.48, "elapsed_time": "1 day, 1:43:31", "remaining_time": "6:14:21"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 333, "loss": 0.3817, "lr": 1.2315016905800158e-05, "epoch": 2.419427288040427, "percentage": 80.78, "elapsed_time": "1 day, 1:49:13", "remaining_time": "6:08:35"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 333, "loss": 0.361, "lr": 1.1947234400600164e-05, "epoch": 2.428411005053341, "percentage": 81.08, "elapsed_time": "1 day, 1:54:54", "remaining_time": "6:02:48"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 333, "loss": 0.3642, "lr": 1.1584377909456147e-05, "epoch": 2.437394722066255, "percentage": 81.38, "elapsed_time": "1 day, 2:00:54", "remaining_time": "5:57:06"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 333, "loss": 0.3727, "lr": 1.1226487490276591e-05, "epoch": 2.446378439079169, "percentage": 81.68, "elapsed_time": "1 day, 2:06:51", "remaining_time": "5:51:23"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 333, "loss": 0.3647, "lr": 1.087360265273545e-05, "epoch": 2.4553621560920833, "percentage": 81.98, "elapsed_time": "1 day, 2:12:23", "remaining_time": "5:45:34"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 333, "loss": 0.383, "lr": 1.0525762353910433e-05, "epoch": 2.464345873104997, "percentage": 82.28, "elapsed_time": "1 day, 2:18:07", "remaining_time": "5:39:48"}
|
| 275 |
+
{"current_steps": 275, "total_steps": 333, "loss": 0.3737, "lr": 1.018300499398232e-05, "epoch": 2.473329590117911, "percentage": 82.58, "elapsed_time": "1 day, 2:23:43", "remaining_time": "5:34:01"}
|
| 276 |
+
{"current_steps": 276, "total_steps": 333, "loss": 0.3781, "lr": 9.8453684119957e-06, "epoch": 2.482313307130825, "percentage": 82.88, "elapsed_time": "1 day, 2:29:43", "remaining_time": "5:28:18"}
|
| 277 |
+
{"current_steps": 277, "total_steps": 333, "loss": 0.3589, "lr": 9.512889881681736e-06, "epoch": 2.4912970241437393, "percentage": 83.18, "elapsed_time": "1 day, 2:35:29", "remaining_time": "5:22:33"}
|
| 278 |
+
{"current_steps": 278, "total_steps": 333, "loss": 0.36, "lr": 9.185606107343261e-06, "epoch": 2.5002807411566534, "percentage": 83.48, "elapsed_time": "1 day, 2:40:56", "remaining_time": "5:16:43"}
|
| 279 |
+
{"current_steps": 279, "total_steps": 333, "loss": 0.3706, "lr": 8.863553219802784e-06, "epoch": 2.5092644581695676, "percentage": 83.78, "elapsed_time": "1 day, 2:46:29", "remaining_time": "5:10:55"}
|
| 280 |
+
{"current_steps": 280, "total_steps": 333, "loss": 0.3807, "lr": 8.546766772413786e-06, "epoch": 2.5182481751824817, "percentage": 84.08, "elapsed_time": "1 day, 2:52:12", "remaining_time": "5:05:10"}
|
| 281 |
+
{"current_steps": 281, "total_steps": 333, "loss": 0.3637, "lr": 8.23528173713578e-06, "epoch": 2.527231892195396, "percentage": 84.38, "elapsed_time": "1 day, 2:57:54", "remaining_time": "4:59:23"}
|
| 282 |
+
{"current_steps": 282, "total_steps": 333, "loss": 0.3667, "lr": 7.929132500673536e-06, "epoch": 2.53621560920831, "percentage": 84.68, "elapsed_time": "1 day, 3:03:42", "remaining_time": "4:53:38"}
|
| 283 |
+
{"current_steps": 283, "total_steps": 333, "loss": 0.3821, "lr": 7.628352860680906e-06, "epoch": 2.545199326221224, "percentage": 84.98, "elapsed_time": "1 day, 3:09:22", "remaining_time": "4:47:52"}
|
| 284 |
+
{"current_steps": 284, "total_steps": 333, "loss": 0.3583, "lr": 7.332976022029765e-06, "epoch": 2.554183043234138, "percentage": 85.29, "elapsed_time": "1 day, 3:14:57", "remaining_time": "4:42:05"}
|
| 285 |
+
{"current_steps": 285, "total_steps": 333, "loss": 0.387, "lr": 7.0430345931442495e-06, "epoch": 2.5631667602470523, "percentage": 85.59, "elapsed_time": "1 day, 3:20:36", "remaining_time": "4:36:18"}
|
| 286 |
+
{"current_steps": 286, "total_steps": 333, "loss": 0.3747, "lr": 6.758560582400965e-06, "epoch": 2.5721504772599664, "percentage": 85.89, "elapsed_time": "1 day, 3:26:18", "remaining_time": "4:30:32"}
|
| 287 |
+
{"current_steps": 287, "total_steps": 333, "loss": 0.3757, "lr": 6.479585394595375e-06, "epoch": 2.5811341942728805, "percentage": 86.19, "elapsed_time": "1 day, 3:31:55", "remaining_time": "4:24:46"}
|
| 288 |
+
{"current_steps": 288, "total_steps": 333, "loss": 0.3641, "lr": 6.206139827474829e-06, "epoch": 2.5901179112857946, "percentage": 86.49, "elapsed_time": "1 day, 3:37:42", "remaining_time": "4:19:01"}
|
| 289 |
+
{"current_steps": 289, "total_steps": 333, "loss": 0.3646, "lr": 5.938254068338624e-06, "epoch": 2.5991016282987087, "percentage": 86.79, "elapsed_time": "1 day, 3:43:23", "remaining_time": "4:13:14"}
|
| 290 |
+
{"current_steps": 290, "total_steps": 333, "loss": 0.381, "lr": 5.675957690705446e-06, "epoch": 2.608085345311623, "percentage": 87.09, "elapsed_time": "1 day, 3:49:20", "remaining_time": "4:07:31"}
|
| 291 |
+
{"current_steps": 291, "total_steps": 333, "loss": 0.3748, "lr": 5.419279651048566e-06, "epoch": 2.6170690623245365, "percentage": 87.39, "elapsed_time": "1 day, 3:54:58", "remaining_time": "4:01:44"}
|
| 292 |
+
{"current_steps": 292, "total_steps": 333, "loss": 0.3605, "lr": 5.168248285599177e-06, "epoch": 2.626052779337451, "percentage": 87.69, "elapsed_time": "1 day, 4:00:58", "remaining_time": "3:56:01"}
|
| 293 |
+
{"current_steps": 293, "total_steps": 333, "loss": 0.3778, "lr": 4.922891307218158e-06, "epoch": 2.6350364963503647, "percentage": 87.99, "elapsed_time": "1 day, 4:06:47", "remaining_time": "3:50:16"}
|
| 294 |
+
{"current_steps": 294, "total_steps": 333, "loss": 0.3748, "lr": 4.6832358023367316e-06, "epoch": 2.6440202133632793, "percentage": 88.29, "elapsed_time": "1 day, 4:12:28", "remaining_time": "3:44:30"}
|
| 295 |
+
{"current_steps": 295, "total_steps": 333, "loss": 0.366, "lr": 4.449308227966143e-06, "epoch": 2.653003930376193, "percentage": 88.59, "elapsed_time": "1 day, 4:18:16", "remaining_time": "3:38:45"}
|
| 296 |
+
{"current_steps": 296, "total_steps": 333, "loss": 0.3757, "lr": 4.221134408777029e-06, "epoch": 2.661987647389107, "percentage": 88.89, "elapsed_time": "1 day, 4:24:06", "remaining_time": "3:33:00"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 333, "loss": 0.3727, "lr": 3.998739534248389e-06, "epoch": 2.670971364402021, "percentage": 89.19, "elapsed_time": "1 day, 4:29:55", "remaining_time": "3:27:15"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 333, "loss": 0.3719, "lr": 3.782148155886801e-06, "epoch": 2.6799550814149353, "percentage": 89.49, "elapsed_time": "1 day, 4:35:48", "remaining_time": "3:21:31"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 333, "loss": 0.3649, "lr": 3.5713841845160227e-06, "epoch": 2.6889387984278494, "percentage": 89.79, "elapsed_time": "1 day, 4:41:37", "remaining_time": "3:15:46"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 333, "loss": 0.3638, "lr": 3.366470887637346e-06, "epoch": 2.6979225154407636, "percentage": 90.09, "elapsed_time": "1 day, 4:47:22", "remaining_time": "3:10:00"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 333, "loss": 0.3732, "lr": 3.1674308868609408e-06, "epoch": 2.7069062324536777, "percentage": 90.39, "elapsed_time": "1 day, 4:53:08", "remaining_time": "3:04:15"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 333, "loss": 0.3798, "lr": 2.9742861554085396e-06, "epoch": 2.715889949466592, "percentage": 90.69, "elapsed_time": "1 day, 4:59:06", "remaining_time": "2:58:31"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 333, "loss": 0.3666, "lr": 2.7870580156876457e-06, "epoch": 2.724873666479506, "percentage": 90.99, "elapsed_time": "1 day, 5:04:50", "remaining_time": "2:52:45"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 333, "loss": 0.3622, "lr": 2.6057671369376755e-06, "epoch": 2.73385738349242, "percentage": 91.29, "elapsed_time": "1 day, 5:10:25", "remaining_time": "2:46:58"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 333, "loss": 0.3715, "lr": 2.4304335329481117e-06, "epoch": 2.742841100505334, "percentage": 91.59, "elapsed_time": "1 day, 5:15:46", "remaining_time": "2:41:11"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 333, "loss": 0.3631, "lr": 2.2610765598490875e-06, "epoch": 2.7518248175182483, "percentage": 91.89, "elapsed_time": "1 day, 5:21:36", "remaining_time": "2:35:26"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 333, "loss": 0.3733, "lr": 2.097714913974531e-06, "epoch": 2.7608085345311624, "percentage": 92.19, "elapsed_time": "1 day, 5:27:15", "remaining_time": "2:29:40"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 333, "loss": 0.3563, "lr": 1.940366629798168e-06, "epoch": 2.7697922515440765, "percentage": 92.49, "elapsed_time": "1 day, 5:32:51", "remaining_time": "2:23:54"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 333, "loss": 0.388, "lr": 1.7890490779426058e-06, "epoch": 2.7787759685569906, "percentage": 92.79, "elapsed_time": "1 day, 5:38:46", "remaining_time": "2:18:09"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 333, "loss": 0.3562, "lr": 1.6437789632616797e-06, "epoch": 2.7877596855699043, "percentage": 93.09, "elapsed_time": "1 day, 5:44:12", "remaining_time": "2:12:22"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 333, "loss": 0.3765, "lr": 1.504572322996265e-06, "epoch": 2.796743402582819, "percentage": 93.39, "elapsed_time": "1 day, 5:49:55", "remaining_time": "2:06:37"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 333, "loss": 0.3744, "lr": 1.371444525003882e-06, "epoch": 2.8057271195957325, "percentage": 93.69, "elapsed_time": "1 day, 5:55:32", "remaining_time": "2:00:51"}
|
| 313 |
+
{"current_steps": 313, "total_steps": 333, "loss": 0.367, "lr": 1.2444102660621238e-06, "epoch": 2.814710836608647, "percentage": 93.99, "elapsed_time": "1 day, 6:01:33", "remaining_time": "1:55:06"}
|
| 314 |
+
{"current_steps": 314, "total_steps": 333, "loss": 0.3731, "lr": 1.1234835702461861e-06, "epoch": 2.8236945536215607, "percentage": 94.29, "elapsed_time": "1 day, 6:07:31", "remaining_time": "1:49:22"}
|
| 315 |
+
{"current_steps": 315, "total_steps": 333, "loss": 0.3676, "lr": 1.0086777873806807e-06, "epoch": 2.832678270634475, "percentage": 94.59, "elapsed_time": "1 day, 6:13:15", "remaining_time": "1:43:36"}
|
| 316 |
+
{"current_steps": 316, "total_steps": 333, "loss": 0.3709, "lr": 9.00005591565833e-07, "epoch": 2.841661987647389, "percentage": 94.89, "elapsed_time": "1 day, 6:19:11", "remaining_time": "1:37:52"}
|
| 317 |
+
{"current_steps": 317, "total_steps": 333, "loss": 0.3776, "lr": 7.974789797783608e-07, "epoch": 2.850645704660303, "percentage": 95.2, "elapsed_time": "1 day, 6:24:58", "remaining_time": "1:32:06"}
|
| 318 |
+
{"current_steps": 318, "total_steps": 333, "loss": 0.3717, "lr": 7.01109270547026e-07, "epoch": 2.859629421673217, "percentage": 95.5, "elapsed_time": "1 day, 6:30:51", "remaining_time": "1:26:21"}
|
| 319 |
+
{"current_steps": 319, "total_steps": 333, "loss": 0.3679, "lr": 6.109071027031233e-07, "epoch": 2.8686131386861313, "percentage": 95.8, "elapsed_time": "1 day, 6:36:33", "remaining_time": "1:20:36"}
|
| 320 |
+
{"current_steps": 320, "total_steps": 333, "loss": 0.3753, "lr": 5.268824342059822e-07, "epoch": 2.8775968556990454, "percentage": 96.1, "elapsed_time": "1 day, 6:42:32", "remaining_time": "1:14:51"}
|
| 321 |
+
{"current_steps": 321, "total_steps": 333, "loss": 0.3693, "lr": 4.4904454104367007e-07, "epoch": 2.8865805727119596, "percentage": 96.4, "elapsed_time": "1 day, 6:48:35", "remaining_time": "1:09:06"}
|
| 322 |
+
{"current_steps": 322, "total_steps": 333, "loss": 0.3683, "lr": 3.7740201620894e-07, "epoch": 2.8955642897248737, "percentage": 96.7, "elapsed_time": "1 day, 6:54:11", "remaining_time": "1:03:20"}
|
| 323 |
+
{"current_steps": 323, "total_steps": 333, "loss": 0.3729, "lr": 3.119627687506124e-07, "epoch": 2.904548006737788, "percentage": 97.0, "elapsed_time": "1 day, 6:59:54", "remaining_time": "0:57:34"}
|
| 324 |
+
{"current_steps": 324, "total_steps": 333, "loss": 0.3664, "lr": 2.527340229004407e-07, "epoch": 2.913531723750702, "percentage": 97.3, "elapsed_time": "1 day, 7:05:38", "remaining_time": "0:51:49"}
|
| 325 |
+
{"current_steps": 325, "total_steps": 333, "loss": 0.3773, "lr": 1.9972231727558538e-07, "epoch": 2.922515440763616, "percentage": 97.6, "elapsed_time": "1 day, 7:11:17", "remaining_time": "0:46:03"}
|
| 326 |
+
{"current_steps": 326, "total_steps": 333, "loss": 0.3618, "lr": 1.529335041567867e-07, "epoch": 2.93149915777653, "percentage": 97.9, "elapsed_time": "1 day, 7:17:07", "remaining_time": "0:40:18"}
|
| 327 |
+
{"current_steps": 327, "total_steps": 333, "loss": 0.3598, "lr": 1.1237274884227121e-07, "epoch": 2.9404828747894443, "percentage": 98.2, "elapsed_time": "1 day, 7:23:00", "remaining_time": "0:34:33"}
|
| 328 |
+
{"current_steps": 328, "total_steps": 333, "loss": 0.3728, "lr": 7.804452907755089e-08, "epoch": 2.9494665918023584, "percentage": 98.5, "elapsed_time": "1 day, 7:28:47", "remaining_time": "0:28:47"}
|
| 329 |
+
{"current_steps": 329, "total_steps": 333, "loss": 0.3682, "lr": 4.9952634561082644e-08, "epoch": 2.958450308815272, "percentage": 98.8, "elapsed_time": "1 day, 7:34:37", "remaining_time": "0:23:02"}
|
| 330 |
+
{"current_steps": 330, "total_steps": 333, "loss": 0.3708, "lr": 2.810016652591411e-08, "epoch": 2.9674340258281866, "percentage": 99.1, "elapsed_time": "1 day, 7:40:11", "remaining_time": "0:17:16"}
|
| 331 |
+
{"current_steps": 331, "total_steps": 333, "loss": 0.3737, "lr": 1.248953739730298e-08, "epoch": 2.9764177428411003, "percentage": 99.4, "elapsed_time": "1 day, 7:46:18", "remaining_time": "0:11:31"}
|
| 332 |
+
{"current_steps": 332, "total_steps": 333, "loss": 0.3671, "lr": 3.1224705263979394e-09, "epoch": 2.985401459854015, "percentage": 99.7, "elapsed_time": "1 day, 7:52:05", "remaining_time": "0:05:45"}
|
| 333 |
+
{"current_steps": 333, "total_steps": 333, "loss": 0.3706, "lr": 0.0, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 7:57:59", "remaining_time": "0:00:00"}
|
| 334 |
+
{"current_steps": 333, "total_steps": 333, "epoch": 2.9943851768669285, "percentage": 100.0, "elapsed_time": "1 day, 7:59:33", "remaining_time": "0:00:00"}
|