Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b08b2efedb963a297454b19b9a93b84c55c66611a8fd5c4401e8a0aaa0f22005
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ac2d95a09d4c3b39e6f62419c954b2abb9acc6ad86d50850a123fe18884e8c62
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6b3f3c1a14d52e37be4c8cb799f9df3e79bdff8a99b6e6c72357d17f075ea08c
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8409661ef7c3b5a47b468f5e4462d8d7f5affeee69dbedf8e9500a5935b0078d
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -14,3 +14,13 @@
|
|
| 14 |
{"current_steps": 130, "total_steps": 246, "loss": 0.4991, "lr": 5e-06, "epoch": 1.5811836115326252, "percentage": 52.85, "elapsed_time": "0:52:45", "remaining_time": "0:47:04"}
|
| 15 |
{"current_steps": 140, "total_steps": 246, "loss": 0.4973, "lr": 5e-06, "epoch": 1.7025796661608497, "percentage": 56.91, "elapsed_time": "0:56:38", "remaining_time": "0:42:53"}
|
| 16 |
{"current_steps": 150, "total_steps": 246, "loss": 0.501, "lr": 5e-06, "epoch": 1.8239757207890743, "percentage": 60.98, "elapsed_time": "1:00:35", "remaining_time": "0:38:46"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 14 |
{"current_steps": 130, "total_steps": 246, "loss": 0.4991, "lr": 5e-06, "epoch": 1.5811836115326252, "percentage": 52.85, "elapsed_time": "0:52:45", "remaining_time": "0:47:04"}
|
| 15 |
{"current_steps": 140, "total_steps": 246, "loss": 0.4973, "lr": 5e-06, "epoch": 1.7025796661608497, "percentage": 56.91, "elapsed_time": "0:56:38", "remaining_time": "0:42:53"}
|
| 16 |
{"current_steps": 150, "total_steps": 246, "loss": 0.501, "lr": 5e-06, "epoch": 1.8239757207890743, "percentage": 60.98, "elapsed_time": "1:00:35", "remaining_time": "0:38:46"}
|
| 17 |
+
{"current_steps": 160, "total_steps": 246, "loss": 0.4963, "lr": 5e-06, "epoch": 1.945371775417299, "percentage": 65.04, "elapsed_time": "1:04:29", "remaining_time": "0:34:39"}
|
| 18 |
+
{"current_steps": 164, "total_steps": 246, "eval_loss": 0.5243988037109375, "epoch": 1.9939301972685888, "percentage": 66.67, "elapsed_time": "1:06:39", "remaining_time": "0:33:19"}
|
| 19 |
+
{"current_steps": 170, "total_steps": 246, "loss": 0.5178, "lr": 5e-06, "epoch": 2.069802731411229, "percentage": 69.11, "elapsed_time": "1:10:34", "remaining_time": "0:31:33"}
|
| 20 |
+
{"current_steps": 180, "total_steps": 246, "loss": 0.4477, "lr": 5e-06, "epoch": 2.191198786039454, "percentage": 73.17, "elapsed_time": "1:14:27", "remaining_time": "0:27:18"}
|
| 21 |
+
{"current_steps": 190, "total_steps": 246, "loss": 0.4478, "lr": 5e-06, "epoch": 2.3125948406676784, "percentage": 77.24, "elapsed_time": "1:18:20", "remaining_time": "0:23:05"}
|
| 22 |
+
{"current_steps": 200, "total_steps": 246, "loss": 0.45, "lr": 5e-06, "epoch": 2.433990895295903, "percentage": 81.3, "elapsed_time": "1:22:13", "remaining_time": "0:18:54"}
|
| 23 |
+
{"current_steps": 210, "total_steps": 246, "loss": 0.4474, "lr": 5e-06, "epoch": 2.5553869499241273, "percentage": 85.37, "elapsed_time": "1:26:06", "remaining_time": "0:14:45"}
|
| 24 |
+
{"current_steps": 220, "total_steps": 246, "loss": 0.4493, "lr": 5e-06, "epoch": 2.676783004552352, "percentage": 89.43, "elapsed_time": "1:30:01", "remaining_time": "0:10:38"}
|
| 25 |
+
{"current_steps": 230, "total_steps": 246, "loss": 0.4476, "lr": 5e-06, "epoch": 2.7981790591805766, "percentage": 93.5, "elapsed_time": "1:33:54", "remaining_time": "0:06:31"}
|
| 26 |
+
{"current_steps": 240, "total_steps": 246, "loss": 0.4507, "lr": 5e-06, "epoch": 2.919575113808801, "percentage": 97.56, "elapsed_time": "1:37:47", "remaining_time": "0:02:26"}
|