Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e51c2b68688c65e39784574e2ad95ce905566522879d31f116353b01de077bed
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:212595710eb925e97b45a355a9bcf17f2538ff211915ba56385a1bb83c42ac26
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e0162f29fbce7b0f4ab1459375afe66c24a32fdcb304d2c57a78fe3ad90d9a5a
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2848e2acc1061595ba5ff316a24e3fb017e7bc278f4a96f0a206cdc9271d3707
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -2,3 +2,8 @@
|
|
| 2 |
{"current_steps": 20, "total_steps": 99, "loss": 0.7619, "lr": 5e-06, "epoch": 0.5904059040590406, "percentage": 20.2, "elapsed_time": "0:10:42", "remaining_time": "0:42:19"}
|
| 3 |
{"current_steps": 30, "total_steps": 99, "loss": 0.7397, "lr": 5e-06, "epoch": 0.8856088560885609, "percentage": 30.3, "elapsed_time": "0:16:02", "remaining_time": "0:36:53"}
|
| 4 |
{"current_steps": 33, "total_steps": 99, "eval_loss": 0.7080272436141968, "epoch": 0.974169741697417, "percentage": 33.33, "elapsed_time": "0:18:19", "remaining_time": "0:36:38"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
{"current_steps": 20, "total_steps": 99, "loss": 0.7619, "lr": 5e-06, "epoch": 0.5904059040590406, "percentage": 20.2, "elapsed_time": "0:10:42", "remaining_time": "0:42:19"}
|
| 3 |
{"current_steps": 30, "total_steps": 99, "loss": 0.7397, "lr": 5e-06, "epoch": 0.8856088560885609, "percentage": 30.3, "elapsed_time": "0:16:02", "remaining_time": "0:36:53"}
|
| 4 |
{"current_steps": 33, "total_steps": 99, "eval_loss": 0.7080272436141968, "epoch": 0.974169741697417, "percentage": 33.33, "elapsed_time": "0:18:19", "remaining_time": "0:36:38"}
|
| 5 |
+
{"current_steps": 40, "total_steps": 99, "loss": 0.7258, "lr": 5e-06, "epoch": 1.1918819188191883, "percentage": 40.4, "elapsed_time": "0:23:00", "remaining_time": "0:33:55"}
|
| 6 |
+
{"current_steps": 50, "total_steps": 99, "loss": 0.6617, "lr": 5e-06, "epoch": 1.4870848708487086, "percentage": 50.51, "elapsed_time": "0:28:20", "remaining_time": "0:27:46"}
|
| 7 |
+
{"current_steps": 60, "total_steps": 99, "loss": 0.6487, "lr": 5e-06, "epoch": 1.7822878228782288, "percentage": 60.61, "elapsed_time": "0:33:40", "remaining_time": "0:21:53"}
|
| 8 |
+
{"current_steps": 67, "total_steps": 99, "eval_loss": 0.6627019643783569, "epoch": 1.988929889298893, "percentage": 67.68, "elapsed_time": "0:37:45", "remaining_time": "0:18:01"}
|
| 9 |
+
{"current_steps": 70, "total_steps": 99, "loss": 0.6553, "lr": 5e-06, "epoch": 2.088560885608856, "percentage": 70.71, "elapsed_time": "0:40:37", "remaining_time": "0:16:49"}
|