Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b354fffd7b84e79ac895bc8a1117f46139d240975a924c31cff85f21174fb0b7
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:603e7982ef56e879785c28122dd2cfcccbb6e1d5dafd78a841530357816d2f12
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a5a3a686c96166a8f129125ee394d5e5b0f323682f7f58ed26439fb0b6b31dac
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:198cc902e4eb81777ae407cb42df9ea1c16386f0183fda869ab0f639d8a0c09d
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -212,3 +212,102 @@
|
|
| 212 |
{"current_steps": 212, "total_steps": 312, "loss": 0.3009, "lr": 1.132232521764884e-05, "epoch": 2.0319488817891376, "percentage": 67.95, "elapsed_time": "1:54:43", "remaining_time": "0:54:07"}
|
| 213 |
{"current_steps": 213, "total_steps": 312, "loss": 0.3387, "lr": 1.1120698719390362e-05, "epoch": 2.0415335463258786, "percentage": 68.27, "elapsed_time": "1:55:18", "remaining_time": "0:53:35"}
|
| 214 |
{"current_steps": 214, "total_steps": 312, "loss": 0.3105, "lr": 1.0920190005209066e-05, "epoch": 2.0511182108626196, "percentage": 68.59, "elapsed_time": "1:55:50", "remaining_time": "0:53:02"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 212 |
{"current_steps": 212, "total_steps": 312, "loss": 0.3009, "lr": 1.132232521764884e-05, "epoch": 2.0319488817891376, "percentage": 67.95, "elapsed_time": "1:54:43", "remaining_time": "0:54:07"}
|
| 213 |
{"current_steps": 213, "total_steps": 312, "loss": 0.3387, "lr": 1.1120698719390362e-05, "epoch": 2.0415335463258786, "percentage": 68.27, "elapsed_time": "1:55:18", "remaining_time": "0:53:35"}
|
| 214 |
{"current_steps": 214, "total_steps": 312, "loss": 0.3105, "lr": 1.0920190005209066e-05, "epoch": 2.0511182108626196, "percentage": 68.59, "elapsed_time": "1:55:50", "remaining_time": "0:53:02"}
|
| 215 |
+
{"current_steps": 215, "total_steps": 312, "loss": 0.2901, "lr": 1.0720824316443321e-05, "epoch": 2.060702875399361, "percentage": 68.91, "elapsed_time": "1:56:25", "remaining_time": "0:52:31"}
|
| 216 |
+
{"current_steps": 216, "total_steps": 312, "loss": 0.3493, "lr": 1.0522626750540029e-05, "epoch": 2.070287539936102, "percentage": 69.23, "elapsed_time": "1:56:53", "remaining_time": "0:51:57"}
|
| 217 |
+
{"current_steps": 217, "total_steps": 312, "loss": 0.2985, "lr": 1.0325622257895205e-05, "epoch": 2.0798722044728435, "percentage": 69.55, "elapsed_time": "1:57:23", "remaining_time": "0:51:23"}
|
| 218 |
+
{"current_steps": 218, "total_steps": 312, "loss": 0.3166, "lr": 1.0129835638713064e-05, "epoch": 2.0894568690095845, "percentage": 69.87, "elapsed_time": "1:57:50", "remaining_time": "0:50:48"}
|
| 219 |
+
{"current_steps": 219, "total_steps": 312, "loss": 0.2843, "lr": 9.935291539884e-06, "epoch": 2.099041533546326, "percentage": 70.19, "elapsed_time": "1:58:25", "remaining_time": "0:50:17"}
|
| 220 |
+
{"current_steps": 220, "total_steps": 312, "loss": 0.3163, "lr": 9.74201445188188e-06, "epoch": 2.108626198083067, "percentage": 70.51, "elapsed_time": "1:58:54", "remaining_time": "0:49:43"}
|
| 221 |
+
{"current_steps": 221, "total_steps": 312, "loss": 0.3222, "lr": 9.550028705681024e-06, "epoch": 2.1182108626198084, "percentage": 70.83, "elapsed_time": "1:59:29", "remaining_time": "0:49:12"}
|
| 222 |
+
{"current_steps": 222, "total_steps": 312, "loss": 0.2909, "lr": 9.359358469693272e-06, "epoch": 2.1277955271565494, "percentage": 71.15, "elapsed_time": "1:59:56", "remaining_time": "0:48:37"}
|
| 223 |
+
{"current_steps": 223, "total_steps": 312, "loss": 0.3146, "lr": 9.170027746725487e-06, "epoch": 2.137380191693291, "percentage": 71.47, "elapsed_time": "2:00:32", "remaining_time": "0:48:06"}
|
| 224 |
+
{"current_steps": 224, "total_steps": 312, "loss": 0.3017, "lr": 8.982060370957953e-06, "epoch": 2.146964856230032, "percentage": 71.79, "elapsed_time": "2:01:02", "remaining_time": "0:47:33"}
|
| 225 |
+
{"current_steps": 225, "total_steps": 312, "loss": 0.3456, "lr": 8.795480004943946e-06, "epoch": 2.1565495207667733, "percentage": 72.12, "elapsed_time": "2:01:37", "remaining_time": "0:47:01"}
|
| 226 |
+
{"current_steps": 226, "total_steps": 312, "loss": 0.2761, "lr": 8.610310136630962e-06, "epoch": 2.1661341853035143, "percentage": 72.44, "elapsed_time": "2:02:10", "remaining_time": "0:46:29"}
|
| 227 |
+
{"current_steps": 227, "total_steps": 312, "loss": 0.302, "lr": 8.426574076403887e-06, "epoch": 2.1757188498402558, "percentage": 72.76, "elapsed_time": "2:02:37", "remaining_time": "0:45:54"}
|
| 228 |
+
{"current_steps": 228, "total_steps": 312, "loss": 0.338, "lr": 8.24429495415054e-06, "epoch": 2.1853035143769968, "percentage": 73.08, "elapsed_time": "2:03:10", "remaining_time": "0:45:22"}
|
| 229 |
+
{"current_steps": 229, "total_steps": 312, "loss": 0.3081, "lr": 8.063495716349929e-06, "epoch": 2.194888178913738, "percentage": 73.4, "elapsed_time": "2:03:39", "remaining_time": "0:44:49"}
|
| 230 |
+
{"current_steps": 230, "total_steps": 312, "loss": 0.3419, "lr": 7.884199123183604e-06, "epoch": 2.2044728434504792, "percentage": 73.72, "elapsed_time": "2:04:11", "remaining_time": "0:44:16"}
|
| 231 |
+
{"current_steps": 231, "total_steps": 312, "loss": 0.2749, "lr": 7.706427745670458e-06, "epoch": 2.2140575079872207, "percentage": 74.04, "elapsed_time": "2:04:46", "remaining_time": "0:43:44"}
|
| 232 |
+
{"current_steps": 232, "total_steps": 312, "loss": 0.3365, "lr": 7.530203962825331e-06, "epoch": 2.2236421725239617, "percentage": 74.36, "elapsed_time": "2:05:15", "remaining_time": "0:43:11"}
|
| 233 |
+
{"current_steps": 233, "total_steps": 312, "loss": 0.3282, "lr": 7.355549958841808e-06, "epoch": 2.2332268370607027, "percentage": 74.68, "elapsed_time": "2:05:51", "remaining_time": "0:42:40"}
|
| 234 |
+
{"current_steps": 234, "total_steps": 312, "loss": 0.2943, "lr": 7.182487720299518e-06, "epoch": 2.242811501597444, "percentage": 75.0, "elapsed_time": "2:06:20", "remaining_time": "0:42:06"}
|
| 235 |
+
{"current_steps": 235, "total_steps": 312, "loss": 0.3252, "lr": 7.01103903339633e-06, "epoch": 2.252396166134185, "percentage": 75.32, "elapsed_time": "2:06:52", "remaining_time": "0:41:34"}
|
| 236 |
+
{"current_steps": 236, "total_steps": 312, "loss": 0.2755, "lr": 6.841225481205749e-06, "epoch": 2.2619808306709266, "percentage": 75.64, "elapsed_time": "2:07:25", "remaining_time": "0:41:02"}
|
| 237 |
+
{"current_steps": 237, "total_steps": 312, "loss": 0.2962, "lr": 6.6730684409599225e-06, "epoch": 2.2715654952076676, "percentage": 75.96, "elapsed_time": "2:08:01", "remaining_time": "0:40:30"}
|
| 238 |
+
{"current_steps": 238, "total_steps": 312, "loss": 0.2951, "lr": 6.5065890813585145e-06, "epoch": 2.281150159744409, "percentage": 76.28, "elapsed_time": "2:08:37", "remaining_time": "0:39:59"}
|
| 239 |
+
{"current_steps": 239, "total_steps": 312, "loss": 0.317, "lr": 6.3418083599038624e-06, "epoch": 2.29073482428115, "percentage": 76.6, "elapsed_time": "2:09:10", "remaining_time": "0:39:27"}
|
| 240 |
+
{"current_steps": 240, "total_steps": 312, "loss": 0.2881, "lr": 6.178747020262708e-06, "epoch": 2.3003194888178915, "percentage": 76.92, "elapsed_time": "2:09:40", "remaining_time": "0:38:54"}
|
| 241 |
+
{"current_steps": 241, "total_steps": 312, "loss": 0.2595, "lr": 6.017425589654853e-06, "epoch": 2.3099041533546325, "percentage": 77.24, "elapsed_time": "2:10:13", "remaining_time": "0:38:21"}
|
| 242 |
+
{"current_steps": 242, "total_steps": 312, "loss": 0.326, "lr": 5.857864376269051e-06, "epoch": 2.319488817891374, "percentage": 77.56, "elapsed_time": "2:10:45", "remaining_time": "0:37:49"}
|
| 243 |
+
{"current_steps": 243, "total_steps": 312, "loss": 0.2744, "lr": 5.700083466706494e-06, "epoch": 2.329073482428115, "percentage": 77.88, "elapsed_time": "2:11:16", "remaining_time": "0:37:16"}
|
| 244 |
+
{"current_steps": 244, "total_steps": 312, "loss": 0.3105, "lr": 5.544102723452171e-06, "epoch": 2.3386581469648564, "percentage": 78.21, "elapsed_time": "2:11:47", "remaining_time": "0:36:43"}
|
| 245 |
+
{"current_steps": 245, "total_steps": 312, "loss": 0.316, "lr": 5.38994178237445e-06, "epoch": 2.3482428115015974, "percentage": 78.53, "elapsed_time": "2:12:22", "remaining_time": "0:36:11"}
|
| 246 |
+
{"current_steps": 246, "total_steps": 312, "loss": 0.3226, "lr": 5.237620050253189e-06, "epoch": 2.357827476038339, "percentage": 78.85, "elapsed_time": "2:12:56", "remaining_time": "0:35:40"}
|
| 247 |
+
{"current_steps": 247, "total_steps": 312, "loss": 0.2614, "lr": 5.087156702336689e-06, "epoch": 2.36741214057508, "percentage": 79.17, "elapsed_time": "2:13:26", "remaining_time": "0:35:07"}
|
| 248 |
+
{"current_steps": 248, "total_steps": 312, "loss": 0.3123, "lr": 4.938570679927784e-06, "epoch": 2.376996805111821, "percentage": 79.49, "elapsed_time": "2:14:01", "remaining_time": "0:34:35"}
|
| 249 |
+
{"current_steps": 249, "total_steps": 312, "loss": 0.3123, "lr": 4.791880687999382e-06, "epoch": 2.3865814696485623, "percentage": 79.81, "elapsed_time": "2:14:35", "remaining_time": "0:34:03"}
|
| 250 |
+
{"current_steps": 250, "total_steps": 312, "loss": 0.3176, "lr": 4.647105192839778e-06, "epoch": 2.3961661341853033, "percentage": 80.13, "elapsed_time": "2:15:06", "remaining_time": "0:33:30"}
|
| 251 |
+
{"current_steps": 251, "total_steps": 312, "loss": 0.3144, "lr": 4.504262419727983e-06, "epoch": 2.405750798722045, "percentage": 80.45, "elapsed_time": "2:15:34", "remaining_time": "0:32:56"}
|
| 252 |
+
{"current_steps": 252, "total_steps": 312, "loss": 0.34, "lr": 4.363370350639405e-06, "epoch": 2.415335463258786, "percentage": 80.77, "elapsed_time": "2:16:07", "remaining_time": "0:32:24"}
|
| 253 |
+
{"current_steps": 253, "total_steps": 312, "loss": 0.2955, "lr": 4.2244467219821806e-06, "epoch": 2.4249201277955272, "percentage": 81.09, "elapsed_time": "2:16:36", "remaining_time": "0:31:51"}
|
| 254 |
+
{"current_steps": 254, "total_steps": 312, "loss": 0.283, "lr": 4.087509022364382e-06, "epoch": 2.4345047923322682, "percentage": 81.41, "elapsed_time": "2:17:08", "remaining_time": "0:31:18"}
|
| 255 |
+
{"current_steps": 255, "total_steps": 312, "loss": 0.3177, "lr": 3.952574490392443e-06, "epoch": 2.4440894568690097, "percentage": 81.73, "elapsed_time": "2:17:43", "remaining_time": "0:30:47"}
|
| 256 |
+
{"current_steps": 256, "total_steps": 312, "loss": 0.302, "lr": 3.819660112501053e-06, "epoch": 2.4536741214057507, "percentage": 82.05, "elapsed_time": "2:18:16", "remaining_time": "0:30:14"}
|
| 257 |
+
{"current_steps": 257, "total_steps": 312, "loss": 0.302, "lr": 3.6887826208147968e-06, "epoch": 2.463258785942492, "percentage": 82.37, "elapsed_time": "2:18:47", "remaining_time": "0:29:42"}
|
| 258 |
+
{"current_steps": 258, "total_steps": 312, "loss": 0.2646, "lr": 3.5599584910418037e-06, "epoch": 2.472843450479233, "percentage": 82.69, "elapsed_time": "2:19:18", "remaining_time": "0:29:09"}
|
| 259 |
+
{"current_steps": 259, "total_steps": 312, "loss": 0.3084, "lr": 3.433203940399672e-06, "epoch": 2.4824281150159746, "percentage": 83.01, "elapsed_time": "2:19:48", "remaining_time": "0:28:36"}
|
| 260 |
+
{"current_steps": 260, "total_steps": 312, "loss": 0.3469, "lr": 3.3085349255739475e-06, "epoch": 2.4920127795527156, "percentage": 83.33, "elapsed_time": "2:20:21", "remaining_time": "0:28:04"}
|
| 261 |
+
{"current_steps": 261, "total_steps": 312, "loss": 0.3093, "lr": 3.1859671407093984e-06, "epoch": 2.501597444089457, "percentage": 83.65, "elapsed_time": "2:20:54", "remaining_time": "0:27:32"}
|
| 262 |
+
{"current_steps": 262, "total_steps": 312, "loss": 0.2979, "lr": 3.0655160154343177e-06, "epoch": 2.511182108626198, "percentage": 83.97, "elapsed_time": "2:21:28", "remaining_time": "0:26:59"}
|
| 263 |
+
{"current_steps": 263, "total_steps": 312, "loss": 0.3047, "lr": 2.947196712918157e-06, "epoch": 2.520766773162939, "percentage": 84.29, "elapsed_time": "2:21:55", "remaining_time": "0:26:26"}
|
| 264 |
+
{"current_steps": 264, "total_steps": 312, "loss": 0.2969, "lr": 2.8310241279626784e-06, "epoch": 2.5303514376996805, "percentage": 84.62, "elapsed_time": "2:22:24", "remaining_time": "0:25:53"}
|
| 265 |
+
{"current_steps": 265, "total_steps": 312, "loss": 0.2981, "lr": 2.7170128851269084e-06, "epoch": 2.539936102236422, "percentage": 84.94, "elapsed_time": "2:22:54", "remaining_time": "0:25:20"}
|
| 266 |
+
{"current_steps": 266, "total_steps": 312, "loss": 0.3308, "lr": 2.6051773368860935e-06, "epoch": 2.549520766773163, "percentage": 85.26, "elapsed_time": "2:23:22", "remaining_time": "0:24:47"}
|
| 267 |
+
{"current_steps": 267, "total_steps": 312, "loss": 0.3134, "lr": 2.4955315618249263e-06, "epoch": 2.559105431309904, "percentage": 85.58, "elapsed_time": "2:23:50", "remaining_time": "0:24:14"}
|
| 268 |
+
{"current_steps": 268, "total_steps": 312, "loss": 0.2988, "lr": 2.38808936286524e-06, "epoch": 2.5686900958466454, "percentage": 85.9, "elapsed_time": "2:24:19", "remaining_time": "0:23:41"}
|
| 269 |
+
{"current_steps": 269, "total_steps": 312, "loss": 0.275, "lr": 2.2828642655284038e-06, "epoch": 2.5782747603833864, "percentage": 86.22, "elapsed_time": "2:24:49", "remaining_time": "0:23:09"}
|
| 270 |
+
{"current_steps": 270, "total_steps": 312, "loss": 0.2913, "lr": 2.1798695162326444e-06, "epoch": 2.587859424920128, "percentage": 86.54, "elapsed_time": "2:25:22", "remaining_time": "0:22:36"}
|
| 271 |
+
{"current_steps": 271, "total_steps": 312, "loss": 0.3142, "lr": 2.0791180806254975e-06, "epoch": 2.597444089456869, "percentage": 86.86, "elapsed_time": "2:25:53", "remaining_time": "0:22:04"}
|
| 272 |
+
{"current_steps": 272, "total_steps": 312, "loss": 0.2994, "lr": 1.9806226419516195e-06, "epoch": 2.6070287539936103, "percentage": 87.18, "elapsed_time": "2:26:23", "remaining_time": "0:21:31"}
|
| 273 |
+
{"current_steps": 273, "total_steps": 312, "loss": 0.3301, "lr": 1.8843955994561191e-06, "epoch": 2.6166134185303513, "percentage": 87.5, "elapsed_time": "2:26:57", "remaining_time": "0:20:59"}
|
| 274 |
+
{"current_steps": 274, "total_steps": 312, "loss": 0.3136, "lr": 1.790449066823683e-06, "epoch": 2.626198083067093, "percentage": 87.82, "elapsed_time": "2:27:31", "remaining_time": "0:20:27"}
|
| 275 |
+
{"current_steps": 275, "total_steps": 312, "loss": 0.3265, "lr": 1.6987948706536038e-06, "epoch": 2.635782747603834, "percentage": 88.14, "elapsed_time": "2:28:06", "remaining_time": "0:19:55"}
|
| 276 |
+
{"current_steps": 276, "total_steps": 312, "loss": 0.3116, "lr": 1.6094445489709886e-06, "epoch": 2.6453674121405752, "percentage": 88.46, "elapsed_time": "2:28:39", "remaining_time": "0:19:23"}
|
| 277 |
+
{"current_steps": 277, "total_steps": 312, "loss": 0.3081, "lr": 1.5224093497742654e-06, "epoch": 2.6549520766773163, "percentage": 88.78, "elapsed_time": "2:29:12", "remaining_time": "0:18:51"}
|
| 278 |
+
{"current_steps": 278, "total_steps": 312, "loss": 0.2914, "lr": 1.4377002296192233e-06, "epoch": 2.6645367412140573, "percentage": 89.1, "elapsed_time": "2:29:48", "remaining_time": "0:18:19"}
|
| 279 |
+
{"current_steps": 279, "total_steps": 312, "loss": 0.3398, "lr": 1.3553278522397162e-06, "epoch": 2.6741214057507987, "percentage": 89.42, "elapsed_time": "2:30:21", "remaining_time": "0:17:47"}
|
| 280 |
+
{"current_steps": 280, "total_steps": 312, "loss": 0.2895, "lr": 1.275302587205256e-06, "epoch": 2.68370607028754, "percentage": 89.74, "elapsed_time": "2:30:52", "remaining_time": "0:17:14"}
|
| 281 |
+
{"current_steps": 281, "total_steps": 312, "loss": 0.3205, "lr": 1.1976345086156193e-06, "epoch": 2.693290734824281, "percentage": 90.06, "elapsed_time": "2:31:22", "remaining_time": "0:16:41"}
|
| 282 |
+
{"current_steps": 282, "total_steps": 312, "loss": 0.307, "lr": 1.1223333938326486e-06, "epoch": 2.702875399361022, "percentage": 90.38, "elapsed_time": "2:31:56", "remaining_time": "0:16:09"}
|
| 283 |
+
{"current_steps": 283, "total_steps": 312, "loss": 0.2977, "lr": 1.0494087222494253e-06, "epoch": 2.7124600638977636, "percentage": 90.71, "elapsed_time": "2:32:31", "remaining_time": "0:15:37"}
|
| 284 |
+
{"current_steps": 284, "total_steps": 312, "loss": 0.2727, "lr": 9.788696740969295e-07, "epoch": 2.722044728434505, "percentage": 91.03, "elapsed_time": "2:33:04", "remaining_time": "0:15:05"}
|
| 285 |
+
{"current_steps": 285, "total_steps": 312, "loss": 0.3241, "lr": 9.107251292883856e-07, "epoch": 2.731629392971246, "percentage": 91.35, "elapsed_time": "2:33:37", "remaining_time": "0:14:33"}
|
| 286 |
+
{"current_steps": 286, "total_steps": 312, "loss": 0.2888, "lr": 8.44983666301391e-07, "epoch": 2.741214057507987, "percentage": 91.67, "elapsed_time": "2:34:10", "remaining_time": "0:14:00"}
|
| 287 |
+
{"current_steps": 287, "total_steps": 312, "loss": 0.3236, "lr": 7.816535610980103e-07, "epoch": 2.7507987220447285, "percentage": 91.99, "elapsed_time": "2:34:46", "remaining_time": "0:13:28"}
|
| 288 |
+
{"current_steps": 288, "total_steps": 312, "loss": 0.3293, "lr": 7.207427860829352e-07, "epoch": 2.7603833865814695, "percentage": 92.31, "elapsed_time": "2:35:13", "remaining_time": "0:12:56"}
|
| 289 |
+
{"current_steps": 289, "total_steps": 312, "loss": 0.2896, "lr": 6.622590090998727e-07, "epoch": 2.769968051118211, "percentage": 92.63, "elapsed_time": "2:35:42", "remaining_time": "0:12:23"}
|
| 290 |
+
{"current_steps": 290, "total_steps": 312, "loss": 0.2977, "lr": 6.062095924662625e-07, "epoch": 2.779552715654952, "percentage": 92.95, "elapsed_time": "2:36:16", "remaining_time": "0:11:51"}
|
| 291 |
+
{"current_steps": 291, "total_steps": 312, "loss": 0.3527, "lr": 5.526015920464689e-07, "epoch": 2.7891373801916934, "percentage": 93.27, "elapsed_time": "2:36:48", "remaining_time": "0:11:18"}
|
| 292 |
+
{"current_steps": 292, "total_steps": 312, "loss": 0.2575, "lr": 5.014417563635276e-07, "epoch": 2.7987220447284344, "percentage": 93.59, "elapsed_time": "2:37:17", "remaining_time": "0:10:46"}
|
| 293 |
+
{"current_steps": 293, "total_steps": 312, "loss": 0.3026, "lr": 4.5273652574961745e-07, "epoch": 2.8083067092651754, "percentage": 93.91, "elapsed_time": "2:37:46", "remaining_time": "0:10:13"}
|
| 294 |
+
{"current_steps": 294, "total_steps": 312, "loss": 0.2953, "lr": 4.064920315352905e-07, "epoch": 2.817891373801917, "percentage": 94.23, "elapsed_time": "2:38:18", "remaining_time": "0:09:41"}
|
| 295 |
+
{"current_steps": 295, "total_steps": 312, "loss": 0.3698, "lr": 3.62714095277632e-07, "epoch": 2.8274760383386583, "percentage": 94.55, "elapsed_time": "2:38:53", "remaining_time": "0:09:09"}
|
| 296 |
+
{"current_steps": 296, "total_steps": 312, "loss": 0.2709, "lr": 3.214082280274067e-07, "epoch": 2.8370607028753994, "percentage": 94.87, "elapsed_time": "2:39:26", "remaining_time": "0:08:37"}
|
| 297 |
+
{"current_steps": 297, "total_steps": 312, "loss": 0.3268, "lr": 2.825796296352823e-07, "epoch": 2.8466453674121404, "percentage": 95.19, "elapsed_time": "2:40:01", "remaining_time": "0:08:04"}
|
| 298 |
+
{"current_steps": 298, "total_steps": 312, "loss": 0.3032, "lr": 2.462331880972468e-07, "epoch": 2.856230031948882, "percentage": 95.51, "elapsed_time": "2:40:29", "remaining_time": "0:07:32"}
|
| 299 |
+
{"current_steps": 299, "total_steps": 312, "loss": 0.3539, "lr": 2.123734789392673e-07, "epoch": 2.8658146964856233, "percentage": 95.83, "elapsed_time": "2:41:01", "remaining_time": "0:07:00"}
|
| 300 |
+
{"current_steps": 300, "total_steps": 312, "loss": 0.2696, "lr": 1.81004764641306e-07, "epoch": 2.8753993610223643, "percentage": 96.15, "elapsed_time": "2:41:38", "remaining_time": "0:06:27"}
|
| 301 |
+
{"current_steps": 301, "total_steps": 312, "loss": 0.3199, "lr": 1.5213099410071873e-07, "epoch": 2.8849840255591053, "percentage": 96.47, "elapsed_time": "2:42:09", "remaining_time": "0:05:55"}
|
| 302 |
+
{"current_steps": 302, "total_steps": 312, "loss": 0.3403, "lr": 1.2575580213514792e-07, "epoch": 2.8945686900958467, "percentage": 96.79, "elapsed_time": "2:42:41", "remaining_time": "0:05:23"}
|
| 303 |
+
{"current_steps": 303, "total_steps": 312, "loss": 0.3211, "lr": 1.0188250902495312e-07, "epoch": 2.9041533546325877, "percentage": 97.12, "elapsed_time": "2:43:18", "remaining_time": "0:04:51"}
|
| 304 |
+
{"current_steps": 304, "total_steps": 312, "loss": 0.3422, "lr": 8.051412009521864e-08, "epoch": 2.913738019169329, "percentage": 97.44, "elapsed_time": "2:43:48", "remaining_time": "0:04:18"}
|
| 305 |
+
{"current_steps": 305, "total_steps": 312, "loss": 0.2635, "lr": 6.165332533744072e-08, "epoch": 2.92332268370607, "percentage": 97.76, "elapsed_time": "2:44:16", "remaining_time": "0:03:46"}
|
| 306 |
+
{"current_steps": 306, "total_steps": 312, "loss": 0.2942, "lr": 4.530249907087836e-08, "epoch": 2.9329073482428116, "percentage": 98.08, "elapsed_time": "2:44:50", "remaining_time": "0:03:13"}
|
| 307 |
+
{"current_steps": 307, "total_steps": 312, "loss": 0.3829, "lr": 3.146369964366791e-08, "epoch": 2.9424920127795526, "percentage": 98.4, "elapsed_time": "2:45:20", "remaining_time": "0:02:41"}
|
| 308 |
+
{"current_steps": 308, "total_steps": 312, "loss": 0.2838, "lr": 2.0138669173708213e-08, "epoch": 2.952076677316294, "percentage": 98.72, "elapsed_time": "2:45:54", "remaining_time": "0:02:09"}
|
| 309 |
+
{"current_steps": 309, "total_steps": 312, "loss": 0.3031, "lr": 1.1328833329333767e-08, "epoch": 2.961661341853035, "percentage": 99.04, "elapsed_time": "2:46:27", "remaining_time": "0:01:36"}
|
| 310 |
+
{"current_steps": 310, "total_steps": 312, "loss": 0.3185, "lr": 5.0353011498693875e-09, "epoch": 2.9712460063897765, "percentage": 99.36, "elapsed_time": "2:46:59", "remaining_time": "0:01:04"}
|
| 311 |
+
{"current_steps": 311, "total_steps": 312, "loss": 0.2968, "lr": 1.2588649059885883e-09, "epoch": 2.9808306709265175, "percentage": 99.68, "elapsed_time": "2:47:31", "remaining_time": "0:00:32"}
|
| 312 |
+
{"current_steps": 312, "total_steps": 312, "loss": 0.3009, "lr": 0.0, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "2:48:07", "remaining_time": "0:00:00"}
|
| 313 |
+
{"current_steps": 312, "total_steps": 312, "epoch": 2.9904153354632586, "percentage": 100.0, "elapsed_time": "2:49:40", "remaining_time": "0:00:00"}
|