Training in progress, step 1652
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dbe2dd2c0c3e8724a125902f63566a6b34902b398b760cee714c477dfac9f7b1
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98fe6a3f205d5fffbd8e9ac76fac267e14c383756a01df514ea2d0bf51de1b56
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d25cdd0ea812470ae614866cc750a857d37dc90c276e2031b6500ba87ed54363
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d7e4b79ffbee6cb6b7a6e6ac3fb9346f56f86095ff43899afdc74d8eb0eab0cd
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -318,3 +318,14 @@
|
|
| 318 |
{"current_steps": 1590, "total_steps": 1652, "loss": 0.1706, "lr": 1.7713366717344803e-07, "epoch": 6.738853503184713, "percentage": 96.25, "elapsed_time": "16:47:33", "remaining_time": "0:39:17"}
|
| 319 |
{"current_steps": 1595, "total_steps": 1652, "loss": 0.1495, "lr": 1.5016678826899055e-07, "epoch": 6.7600849256900215, "percentage": 96.55, "elapsed_time": "16:50:42", "remaining_time": "0:36:07"}
|
| 320 |
{"current_steps": 1600, "total_steps": 1652, "loss": 0.1599, "lr": 1.2541787571594522e-07, "epoch": 6.781316348195329, "percentage": 96.85, "elapsed_time": "16:53:51", "remaining_time": "0:32:57"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 318 |
{"current_steps": 1590, "total_steps": 1652, "loss": 0.1706, "lr": 1.7713366717344803e-07, "epoch": 6.738853503184713, "percentage": 96.25, "elapsed_time": "16:47:33", "remaining_time": "0:39:17"}
|
| 319 |
{"current_steps": 1595, "total_steps": 1652, "loss": 0.1495, "lr": 1.5016678826899055e-07, "epoch": 6.7600849256900215, "percentage": 96.55, "elapsed_time": "16:50:42", "remaining_time": "0:36:07"}
|
| 320 |
{"current_steps": 1600, "total_steps": 1652, "loss": 0.1599, "lr": 1.2541787571594522e-07, "epoch": 6.781316348195329, "percentage": 96.85, "elapsed_time": "16:53:51", "remaining_time": "0:32:57"}
|
| 321 |
+
{"current_steps": 1605, "total_steps": 1652, "loss": 0.1417, "lr": 1.0288969489046008e-07, "epoch": 6.802547770700637, "percentage": 97.15, "elapsed_time": "16:58:16", "remaining_time": "0:29:49"}
|
| 322 |
+
{"current_steps": 1610, "total_steps": 1652, "loss": 0.148, "lr": 8.258476303016017e-08, "epoch": 6.823779193205945, "percentage": 97.46, "elapsed_time": "17:01:27", "remaining_time": "0:26:38"}
|
| 323 |
+
{"current_steps": 1615, "total_steps": 1652, "loss": 0.1707, "lr": 6.45053489528813e-08, "epoch": 6.845010615711253, "percentage": 97.76, "elapsed_time": "17:04:36", "remaining_time": "0:23:28"}
|
| 324 |
+
{"current_steps": 1620, "total_steps": 1652, "loss": 0.1737, "lr": 4.8653472803159576e-08, "epoch": 6.86624203821656, "percentage": 98.06, "elapsed_time": "17:07:44", "remaining_time": "0:20:18"}
|
| 325 |
+
{"current_steps": 1625, "total_steps": 1652, "loss": 0.1656, "lr": 3.503090582650081e-08, "epoch": 6.887473460721869, "percentage": 98.37, "elapsed_time": "17:10:53", "remaining_time": "0:17:07"}
|
| 326 |
+
{"current_steps": 1630, "total_steps": 1652, "loss": 0.1578, "lr": 2.3639170171474434e-08, "epoch": 6.908704883227176, "percentage": 98.67, "elapsed_time": "17:14:01", "remaining_time": "0:13:57"}
|
| 327 |
+
{"current_steps": 1635, "total_steps": 1652, "loss": 0.1607, "lr": 1.4479538719622822e-08, "epoch": 6.929936305732484, "percentage": 98.97, "elapsed_time": "17:17:10", "remaining_time": "0:10:47"}
|
| 328 |
+
{"current_steps": 1640, "total_steps": 1652, "loss": 0.174, "lr": 7.553034943243998e-09, "epoch": 6.951167728237792, "percentage": 99.27, "elapsed_time": "17:20:19", "remaining_time": "0:07:36"}
|
| 329 |
+
{"current_steps": 1645, "total_steps": 1652, "loss": 0.1679, "lr": 2.8604327910186634e-09, "epoch": 6.9723991507431, "percentage": 99.58, "elapsed_time": "17:23:27", "remaining_time": "0:04:26"}
|
| 330 |
+
{"current_steps": 1650, "total_steps": 1652, "loss": 0.1742, "lr": 4.02256601546025e-10, "epoch": 6.993630573248407, "percentage": 99.88, "elapsed_time": "17:26:34", "remaining_time": "0:01:16"}
|
| 331 |
+
{"current_steps": 1652, "total_steps": 1652, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "17:28:51", "remaining_time": "0:00:00"}
|