Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1f26d066bb6cf52c187390bc0d9f284deae93d17fb3f6d1d50dc2ba798f8b2b
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f3cd73dbe75492e0217884a456f781a074cdcc315257f8144fde0fc462dfe59
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ae016ecd6a3e80e702c7c025705017e8ab2224265952dc652bbb49c7b1ba033a
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7a34edd4b5b1e690f2f0f38a809d60a94d3a635af44523b39cdfb38e99545065
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -14,3 +14,13 @@
|
|
| 14 |
{"current_steps": 14, "total_steps": 30, "loss": 0.7208, "lr": 6.434016163555452e-06, "epoch": 1.34375, "percentage": 46.67, "elapsed_time": "0:07:06", "remaining_time": "0:08:07"}
|
| 15 |
{"current_steps": 15, "total_steps": 30, "loss": 0.768, "lr": 5.8682408883346535e-06, "epoch": 1.4375, "percentage": 50.0, "elapsed_time": "0:07:37", "remaining_time": "0:07:37"}
|
| 16 |
{"current_steps": 16, "total_steps": 30, "loss": 0.7986, "lr": 5.290724144552379e-06, "epoch": 1.53125, "percentage": 53.33, "elapsed_time": "0:08:06", "remaining_time": "0:07:05"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
{"current_steps": 14, "total_steps": 30, "loss": 0.7208, "lr": 6.434016163555452e-06, "epoch": 1.34375, "percentage": 46.67, "elapsed_time": "0:07:06", "remaining_time": "0:08:07"}
|
| 15 |
{"current_steps": 15, "total_steps": 30, "loss": 0.768, "lr": 5.8682408883346535e-06, "epoch": 1.4375, "percentage": 50.0, "elapsed_time": "0:07:37", "remaining_time": "0:07:37"}
|
| 16 |
{"current_steps": 16, "total_steps": 30, "loss": 0.7986, "lr": 5.290724144552379e-06, "epoch": 1.53125, "percentage": 53.33, "elapsed_time": "0:08:06", "remaining_time": "0:07:05"}
|
| 17 |
+
{"current_steps": 17, "total_steps": 30, "loss": 0.6939, "lr": 4.7092758554476215e-06, "epoch": 1.625, "percentage": 56.67, "elapsed_time": "0:08:41", "remaining_time": "0:06:38"}
|
| 18 |
+
{"current_steps": 18, "total_steps": 30, "loss": 0.7287, "lr": 4.131759111665349e-06, "epoch": 1.71875, "percentage": 60.0, "elapsed_time": "0:09:09", "remaining_time": "0:06:06"}
|
| 19 |
+
{"current_steps": 19, "total_steps": 30, "loss": 0.7368, "lr": 3.5659838364445505e-06, "epoch": 1.8125, "percentage": 63.33, "elapsed_time": "0:09:34", "remaining_time": "0:05:32"}
|
| 20 |
+
{"current_steps": 20, "total_steps": 30, "loss": 0.6756, "lr": 3.019601169804216e-06, "epoch": 1.90625, "percentage": 66.67, "elapsed_time": "0:10:01", "remaining_time": "0:05:00"}
|
| 21 |
+
{"current_steps": 21, "total_steps": 30, "loss": 1.1922, "lr": 2.5000000000000015e-06, "epoch": 2.03125, "percentage": 70.0, "elapsed_time": "0:11:14", "remaining_time": "0:04:48"}
|
| 22 |
+
{"current_steps": 22, "total_steps": 30, "loss": 0.6695, "lr": 2.0142070414860704e-06, "epoch": 2.125, "percentage": 73.33, "elapsed_time": "0:11:46", "remaining_time": "0:04:16"}
|
| 23 |
+
{"current_steps": 23, "total_steps": 30, "loss": 0.6786, "lr": 1.5687918106563326e-06, "epoch": 2.21875, "percentage": 76.67, "elapsed_time": "0:12:09", "remaining_time": "0:03:42"}
|
| 24 |
+
{"current_steps": 24, "total_steps": 30, "loss": 0.7032, "lr": 1.1697777844051105e-06, "epoch": 2.3125, "percentage": 80.0, "elapsed_time": "0:12:35", "remaining_time": "0:03:08"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 30, "loss": 0.6561, "lr": 8.225609429353187e-07, "epoch": 2.40625, "percentage": 83.33, "elapsed_time": "0:13:07", "remaining_time": "0:02:37"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 30, "loss": 0.6628, "lr": 5.318367983829393e-07, "epoch": 2.5, "percentage": 86.67, "elapsed_time": "0:13:30", "remaining_time": "0:02:04"}
|