Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f19856a1e8c1b5d59c228fa083db4efbae8a697ddae9459cb4be66e2eb8a4db6
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2cbab3c2438931f42949da3f3d7c46971991fec6cf53d0c7d433927cb1d9a77e
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d8e732c9070365f668a83e45569ed681cc0f21fc2041e808998874ee654e917
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3d5e3c00a34ab4a8c61c2ba9a39b101ab6a2a97ce8d3275427bc750b0f38463
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -2,3 +2,8 @@
|
|
| 2 |
{"current_steps": 20, "total_steps": 105, "loss": 0.8918, "lr": 5e-06, "epoch": 0.5714285714285714, "percentage": 19.05, "elapsed_time": "0:51:48", "remaining_time": "3:40:09"}
|
| 3 |
{"current_steps": 30, "total_steps": 105, "loss": 0.853, "lr": 5e-06, "epoch": 0.8571428571428571, "percentage": 28.57, "elapsed_time": "1:17:39", "remaining_time": "3:14:09"}
|
| 4 |
{"current_steps": 35, "total_steps": 105, "eval_loss": 0.8312212824821472, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "1:32:23", "remaining_time": "3:04:46"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
{"current_steps": 20, "total_steps": 105, "loss": 0.8918, "lr": 5e-06, "epoch": 0.5714285714285714, "percentage": 19.05, "elapsed_time": "0:51:48", "remaining_time": "3:40:09"}
|
| 3 |
{"current_steps": 30, "total_steps": 105, "loss": 0.853, "lr": 5e-06, "epoch": 0.8571428571428571, "percentage": 28.57, "elapsed_time": "1:17:39", "remaining_time": "3:14:09"}
|
| 4 |
{"current_steps": 35, "total_steps": 105, "eval_loss": 0.8312212824821472, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "1:32:23", "remaining_time": "3:04:46"}
|
| 5 |
+
{"current_steps": 40, "total_steps": 105, "loss": 0.8164, "lr": 5e-06, "epoch": 1.1428571428571428, "percentage": 38.1, "elapsed_time": "1:46:40", "remaining_time": "2:53:21"}
|
| 6 |
+
{"current_steps": 50, "total_steps": 105, "loss": 0.7836, "lr": 5e-06, "epoch": 1.4285714285714286, "percentage": 47.62, "elapsed_time": "2:12:31", "remaining_time": "2:25:46"}
|
| 7 |
+
{"current_steps": 60, "total_steps": 105, "loss": 0.7806, "lr": 5e-06, "epoch": 1.7142857142857144, "percentage": 57.14, "elapsed_time": "2:38:22", "remaining_time": "1:58:46"}
|
| 8 |
+
{"current_steps": 70, "total_steps": 105, "loss": 0.7709, "lr": 5e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:04:13", "remaining_time": "1:32:06"}
|
| 9 |
+
{"current_steps": 70, "total_steps": 105, "eval_loss": 0.8022096753120422, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:06:02", "remaining_time": "1:33:01"}
|