Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a41ad614b2797c64d8cd3e11ff07cf575b61de092f04f0080b6ddee7d45a8c9a
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:51ac3dddb7708985cc059c7505a4b80fcbf14becbdb7e7840337c0082042060b
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb567d1783f6cde122acde16500f365c978c9d4ee5b844babec5193ac5ec2d26
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7b72094281152af5035f9a5c5d58600faa6f44b466efe7e32dae67080dc5efa5
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -2,3 +2,7 @@
|
|
| 2 |
{"current_steps": 20, "total_steps": 99, "loss": 0.6311, "lr": 5e-06, "epoch": 0.6060606060606061, "percentage": 20.2, "elapsed_time": "0:52:12", "remaining_time": "3:26:14"}
|
| 3 |
{"current_steps": 30, "total_steps": 99, "loss": 0.5836, "lr": 5e-06, "epoch": 0.9090909090909091, "percentage": 30.3, "elapsed_time": "1:18:16", "remaining_time": "3:00:00"}
|
| 4 |
{"current_steps": 33, "total_steps": 99, "eval_loss": 0.5525021553039551, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "1:27:47", "remaining_time": "2:55:34"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
{"current_steps": 20, "total_steps": 99, "loss": 0.6311, "lr": 5e-06, "epoch": 0.6060606060606061, "percentage": 20.2, "elapsed_time": "0:52:12", "remaining_time": "3:26:14"}
|
| 3 |
{"current_steps": 30, "total_steps": 99, "loss": 0.5836, "lr": 5e-06, "epoch": 0.9090909090909091, "percentage": 30.3, "elapsed_time": "1:18:16", "remaining_time": "3:00:00"}
|
| 4 |
{"current_steps": 33, "total_steps": 99, "eval_loss": 0.5525021553039551, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "1:27:47", "remaining_time": "2:55:34"}
|
| 5 |
+
{"current_steps": 40, "total_steps": 99, "loss": 0.5298, "lr": 5e-06, "epoch": 1.2121212121212122, "percentage": 40.4, "elapsed_time": "1:47:22", "remaining_time": "2:38:22"}
|
| 6 |
+
{"current_steps": 50, "total_steps": 99, "loss": 0.5052, "lr": 5e-06, "epoch": 1.5151515151515151, "percentage": 50.51, "elapsed_time": "2:13:18", "remaining_time": "2:10:38"}
|
| 7 |
+
{"current_steps": 60, "total_steps": 99, "loss": 0.4923, "lr": 5e-06, "epoch": 1.8181818181818183, "percentage": 60.61, "elapsed_time": "2:39:13", "remaining_time": "1:43:29"}
|
| 8 |
+
{"current_steps": 66, "total_steps": 99, "eval_loss": 0.513215959072113, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "2:56:31", "remaining_time": "1:28:15"}
|