Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:554244aec94ede1891c5897e8d55405ef0f2b242dcdd03f8a07024370aded9b5
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89b60273e59ccbbde7feee830b59d8f891e32439b261f4448b6ff13b0a9d3a8c
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7750bc12cd1cceccc1a830075e2fe088f4c73614d11b60a76cf28833be552823
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1e238d204f725fb028400a531a16690e989becb5c29fff3f4821303047fbc5d4
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -2,3 +2,7 @@
|
|
| 2 |
{"current_steps": 20, "total_steps": 102, "loss": 0.7615, "lr": 5e-06, "epoch": 0.5871559633027523, "percentage": 19.61, "elapsed_time": "0:53:06", "remaining_time": "3:37:45"}
|
| 3 |
{"current_steps": 30, "total_steps": 102, "loss": 0.7229, "lr": 5e-06, "epoch": 0.8807339449541285, "percentage": 29.41, "elapsed_time": "1:19:24", "remaining_time": "3:10:34"}
|
| 4 |
{"current_steps": 34, "total_steps": 102, "eval_loss": 0.6932151913642883, "epoch": 0.998165137614679, "percentage": 33.33, "elapsed_time": "1:31:54", "remaining_time": "3:03:49"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
{"current_steps": 20, "total_steps": 102, "loss": 0.7615, "lr": 5e-06, "epoch": 0.5871559633027523, "percentage": 19.61, "elapsed_time": "0:53:06", "remaining_time": "3:37:45"}
|
| 3 |
{"current_steps": 30, "total_steps": 102, "loss": 0.7229, "lr": 5e-06, "epoch": 0.8807339449541285, "percentage": 29.41, "elapsed_time": "1:19:24", "remaining_time": "3:10:34"}
|
| 4 |
{"current_steps": 34, "total_steps": 102, "eval_loss": 0.6932151913642883, "epoch": 0.998165137614679, "percentage": 33.33, "elapsed_time": "1:31:54", "remaining_time": "3:03:49"}
|
| 5 |
+
{"current_steps": 40, "total_steps": 102, "loss": 0.684, "lr": 5e-06, "epoch": 1.1743119266055047, "percentage": 39.22, "elapsed_time": "1:48:54", "remaining_time": "2:48:47"}
|
| 6 |
+
{"current_steps": 50, "total_steps": 102, "loss": 0.6549, "lr": 5e-06, "epoch": 1.4678899082568808, "percentage": 49.02, "elapsed_time": "2:15:00", "remaining_time": "2:20:24"}
|
| 7 |
+
{"current_steps": 60, "total_steps": 102, "loss": 0.6412, "lr": 5e-06, "epoch": 1.761467889908257, "percentage": 58.82, "elapsed_time": "2:41:06", "remaining_time": "1:52:46"}
|
| 8 |
+
{"current_steps": 68, "total_steps": 102, "eval_loss": 0.6560695171356201, "epoch": 1.996330275229358, "percentage": 66.67, "elapsed_time": "3:04:05", "remaining_time": "1:32:02"}
|