Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ba7fac79a9d55c12d5472170cbf9d661ae1c05dcb5a800935b2ced850700fdb2
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af4b0f8e8a934b14b20792dde1bbccbf4ce3d349286ec181ca6df374c45e5bd4
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cc035c38a33ce599320d88236efd358372aa15b753ae16a8110a5b244203898e
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f361880720fb59ab667b95745b9797cb2e3dc2ec32222e4a7f87521a0c551314
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -2,3 +2,8 @@
|
|
| 2 |
{"current_steps": 20, "total_steps": 105, "loss": 0.8909, "lr": 5e-06, "epoch": 0.5714285714285714, "percentage": 19.05, "elapsed_time": "0:51:48", "remaining_time": "3:40:10"}
|
| 3 |
{"current_steps": 30, "total_steps": 105, "loss": 0.8553, "lr": 5e-06, "epoch": 0.8571428571428571, "percentage": 28.57, "elapsed_time": "1:17:38", "remaining_time": "3:14:06"}
|
| 4 |
{"current_steps": 35, "total_steps": 105, "eval_loss": 0.8304302096366882, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "1:32:22", "remaining_time": "3:04:45"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
{"current_steps": 20, "total_steps": 105, "loss": 0.8909, "lr": 5e-06, "epoch": 0.5714285714285714, "percentage": 19.05, "elapsed_time": "0:51:48", "remaining_time": "3:40:10"}
|
| 3 |
{"current_steps": 30, "total_steps": 105, "loss": 0.8553, "lr": 5e-06, "epoch": 0.8571428571428571, "percentage": 28.57, "elapsed_time": "1:17:38", "remaining_time": "3:14:06"}
|
| 4 |
{"current_steps": 35, "total_steps": 105, "eval_loss": 0.8304302096366882, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "1:32:22", "remaining_time": "3:04:45"}
|
| 5 |
+
{"current_steps": 40, "total_steps": 105, "loss": 0.82, "lr": 5e-06, "epoch": 1.1428571428571428, "percentage": 38.1, "elapsed_time": "1:46:42", "remaining_time": "2:53:23"}
|
| 6 |
+
{"current_steps": 50, "total_steps": 105, "loss": 0.7824, "lr": 5e-06, "epoch": 1.4285714285714286, "percentage": 47.62, "elapsed_time": "2:12:33", "remaining_time": "2:25:48"}
|
| 7 |
+
{"current_steps": 60, "total_steps": 105, "loss": 0.7773, "lr": 5e-06, "epoch": 1.7142857142857144, "percentage": 57.14, "elapsed_time": "2:38:24", "remaining_time": "1:58:48"}
|
| 8 |
+
{"current_steps": 70, "total_steps": 105, "loss": 0.7733, "lr": 5e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:04:15", "remaining_time": "1:32:07"}
|
| 9 |
+
{"current_steps": 70, "total_steps": 105, "eval_loss": 0.8000528812408447, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:06:04", "remaining_time": "1:33:02"}
|