Training in progress, step 2600
Browse files- model.safetensors +1 -1
- trainer_log.jsonl +25 -0
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3554214752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bacff4e2022fc15a0007d97c52cc61a1f749c7d46fa0b3922ffbbe34b92789cb
|
| 3 |
size 3554214752
|
trainer_log.jsonl
CHANGED
|
@@ -238,3 +238,28 @@
|
|
| 238 |
{"current_steps": 2380, "total_steps": 3235, "loss": 0.0088, "lr": 3.972133925115125e-06, "epoch": 0.7358169732570722, "percentage": 73.57, "elapsed_time": "1 day, 14:51:42", "remaining_time": "13:57:39"}
|
| 239 |
{"current_steps": 2390, "total_steps": 3235, "loss": 0.0088, "lr": 3.8863758593510074e-06, "epoch": 0.7389086412119339, "percentage": 73.88, "elapsed_time": "1 day, 15:01:23", "remaining_time": "13:47:48"}
|
| 240 |
{"current_steps": 2400, "total_steps": 3235, "loss": 0.0089, "lr": 3.801329842543745e-06, "epoch": 0.7420003091667955, "percentage": 74.19, "elapsed_time": "1 day, 15:11:01", "remaining_time": "13:37:57"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 238 |
{"current_steps": 2380, "total_steps": 3235, "loss": 0.0088, "lr": 3.972133925115125e-06, "epoch": 0.7358169732570722, "percentage": 73.57, "elapsed_time": "1 day, 14:51:42", "remaining_time": "13:57:39"}
|
| 239 |
{"current_steps": 2390, "total_steps": 3235, "loss": 0.0088, "lr": 3.8863758593510074e-06, "epoch": 0.7389086412119339, "percentage": 73.88, "elapsed_time": "1 day, 15:01:23", "remaining_time": "13:47:48"}
|
| 240 |
{"current_steps": 2400, "total_steps": 3235, "loss": 0.0089, "lr": 3.801329842543745e-06, "epoch": 0.7420003091667955, "percentage": 74.19, "elapsed_time": "1 day, 15:11:01", "remaining_time": "13:37:57"}
|
| 241 |
+
{"current_steps": 2410, "total_steps": 3235, "loss": 0.0083, "lr": 3.717005779935482e-06, "epoch": 0.7450919771216571, "percentage": 74.5, "elapsed_time": "1 day, 15:21:56", "remaining_time": "13:28:32"}
|
| 242 |
+
{"current_steps": 2420, "total_steps": 3235, "loss": 0.0087, "lr": 3.633413492682952e-06, "epoch": 0.7481836450765188, "percentage": 74.81, "elapsed_time": "1 day, 15:31:36", "remaining_time": "13:18:42"}
|
| 243 |
+
{"current_steps": 2430, "total_steps": 3235, "loss": 0.0092, "lr": 3.5505627167135713e-06, "epoch": 0.7512753130313804, "percentage": 75.12, "elapsed_time": "1 day, 15:41:15", "remaining_time": "13:08:51"}
|
| 244 |
+
{"current_steps": 2440, "total_steps": 3235, "loss": 0.0088, "lr": 3.4684631015915405e-06, "epoch": 0.7543669809862421, "percentage": 75.43, "elapsed_time": "1 day, 15:51:04", "remaining_time": "12:59:03"}
|
| 245 |
+
{"current_steps": 2450, "total_steps": 3235, "loss": 0.0086, "lr": 3.3871242093939336e-06, "epoch": 0.7574586489411037, "percentage": 75.73, "elapsed_time": "1 day, 16:00:51", "remaining_time": "12:49:15"}
|
| 246 |
+
{"current_steps": 2460, "total_steps": 3235, "loss": 0.0085, "lr": 3.3065555135970563e-06, "epoch": 0.7605503168959654, "percentage": 76.04, "elapsed_time": "1 day, 16:10:41", "remaining_time": "12:39:27"}
|
| 247 |
+
{"current_steps": 2470, "total_steps": 3235, "loss": 0.0081, "lr": 3.226766397973021e-06, "epoch": 0.763641984850827, "percentage": 76.35, "elapsed_time": "1 day, 16:20:23", "remaining_time": "12:29:38"}
|
| 248 |
+
{"current_steps": 2480, "total_steps": 3235, "loss": 0.009, "lr": 3.1477661554968754e-06, "epoch": 0.7667336528056886, "percentage": 76.66, "elapsed_time": "1 day, 16:30:05", "remaining_time": "12:19:48"}
|
| 249 |
+
{"current_steps": 2490, "total_steps": 3235, "loss": 0.0088, "lr": 3.0695639872642312e-06, "epoch": 0.7698253207605503, "percentage": 76.97, "elapsed_time": "1 day, 16:39:46", "remaining_time": "12:09:58"}
|
| 250 |
+
{"current_steps": 2500, "total_steps": 3235, "loss": 0.0084, "lr": 2.9921690014196146e-06, "epoch": 0.7729169887154119, "percentage": 77.28, "elapsed_time": "1 day, 16:49:31", "remaining_time": "12:00:09"}
|
| 251 |
+
{"current_steps": 2510, "total_steps": 3235, "loss": 0.009, "lr": 2.915590212095685e-06, "epoch": 0.7760086566702736, "percentage": 77.59, "elapsed_time": "1 day, 17:00:27", "remaining_time": "11:50:41"}
|
| 252 |
+
{"current_steps": 2520, "total_steps": 3235, "loss": 0.0085, "lr": 2.83983653836331e-06, "epoch": 0.7791003246251352, "percentage": 77.9, "elapsed_time": "1 day, 17:10:03", "remaining_time": "11:40:49"}
|
| 253 |
+
{"current_steps": 2530, "total_steps": 3235, "loss": 0.0088, "lr": 2.764916803192822e-06, "epoch": 0.7821919925799969, "percentage": 78.21, "elapsed_time": "1 day, 17:19:49", "remaining_time": "11:31:01"}
|
| 254 |
+
{"current_steps": 2540, "total_steps": 3235, "loss": 0.0086, "lr": 2.6908397324263746e-06, "epoch": 0.7852836605348585, "percentage": 78.52, "elapsed_time": "1 day, 17:29:35", "remaining_time": "11:21:12"}
|
| 255 |
+
{"current_steps": 2550, "total_steps": 3235, "loss": 0.0083, "lr": 2.617613953761675e-06, "epoch": 0.7883753284897203, "percentage": 78.83, "elapsed_time": "1 day, 17:39:13", "remaining_time": "11:11:21"}
|
| 256 |
+
{"current_steps": 2560, "total_steps": 3235, "loss": 0.0087, "lr": 2.545247995747111e-06, "epoch": 0.7914669964445818, "percentage": 79.13, "elapsed_time": "1 day, 17:48:59", "remaining_time": "11:01:33"}
|
| 257 |
+
{"current_steps": 2570, "total_steps": 3235, "loss": 0.0083, "lr": 2.4737502867884435e-06, "epoch": 0.7945586643994434, "percentage": 79.44, "elapsed_time": "1 day, 17:58:46", "remaining_time": "10:51:44"}
|
| 258 |
+
{"current_steps": 2580, "total_steps": 3235, "loss": 0.0083, "lr": 2.403129154167153e-06, "epoch": 0.7976503323543052, "percentage": 79.75, "elapsed_time": "1 day, 18:08:30", "remaining_time": "10:41:55"}
|
| 259 |
+
{"current_steps": 2590, "total_steps": 3235, "loss": 0.0088, "lr": 2.3333928230705607e-06, "epoch": 0.8007420003091668, "percentage": 80.06, "elapsed_time": "1 day, 18:18:06", "remaining_time": "10:32:04"}
|
| 260 |
+
{"current_steps": 2600, "total_steps": 3235, "loss": 0.0083, "lr": 2.2645494156338753e-06, "epoch": 0.8038336682640285, "percentage": 80.37, "elapsed_time": "1 day, 18:27:44", "remaining_time": "10:22:14"}
|
| 261 |
+
{"current_steps": 2610, "total_steps": 3235, "loss": 0.0087, "lr": 2.1966069499941736e-06, "epoch": 0.8069253362188901, "percentage": 80.68, "elapsed_time": "1 day, 18:38:32", "remaining_time": "10:12:40"}
|
| 262 |
+
{"current_steps": 2620, "total_steps": 3235, "loss": 0.0087, "lr": 2.129573339356571e-06, "epoch": 0.8100170041737518, "percentage": 80.99, "elapsed_time": "1 day, 18:48:10", "remaining_time": "10:02:50"}
|
| 263 |
+
{"current_steps": 2630, "total_steps": 3235, "loss": 0.0085, "lr": 2.063456391072548e-06, "epoch": 0.8131086721286134, "percentage": 81.3, "elapsed_time": "1 day, 18:57:51", "remaining_time": "9:53:00"}
|
| 264 |
+
{"current_steps": 2640, "total_steps": 3235, "loss": 0.0092, "lr": 1.998263805730658e-06, "epoch": 0.8162003400834751, "percentage": 81.61, "elapsed_time": "1 day, 19:07:30", "remaining_time": "9:43:10"}
|
| 265 |
+
{"current_steps": 2650, "total_steps": 3235, "loss": 0.0085, "lr": 1.9340031762596322e-06, "epoch": 0.8192920080383367, "percentage": 81.92, "elapsed_time": "1 day, 19:17:14", "remaining_time": "9:33:21"}
|