Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aabd14eb991de378cec947dec46e2c4fe49a8eb58afc7585ea8dd51f18f41bd0
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6cd2890f1463cfd889f74f1b6e6eabc12fdf867eecf85dad2ddca6ef780cb67c
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:49f54d8dfefb6c6d67acc0e5db8184594389ef5b8b516809e23e02e812766500
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1bd7934a088dc7a4e163013a8d6ef48297394687f828e57a948e7ecd6c158982
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -10,3 +10,14 @@
|
|
| 10 |
{"current_steps": 10, "total_steps": 30, "loss": 1.0839, "lr": 8.43120818934367e-06, "epoch": 0.96, "percentage": 33.33, "elapsed_time": "0:09:03", "remaining_time": "0:18:07"}
|
| 11 |
{"current_steps": 11, "total_steps": 30, "loss": 1.6738, "lr": 7.985792958513932e-06, "epoch": 1.064, "percentage": 36.67, "elapsed_time": "0:11:07", "remaining_time": "0:19:13"}
|
| 12 |
{"current_steps": 12, "total_steps": 30, "loss": 1.0706, "lr": 7.500000000000001e-06, "epoch": 1.16, "percentage": 40.0, "elapsed_time": "0:12:00", "remaining_time": "0:18:00"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10 |
{"current_steps": 10, "total_steps": 30, "loss": 1.0839, "lr": 8.43120818934367e-06, "epoch": 0.96, "percentage": 33.33, "elapsed_time": "0:09:03", "remaining_time": "0:18:07"}
|
| 11 |
{"current_steps": 11, "total_steps": 30, "loss": 1.6738, "lr": 7.985792958513932e-06, "epoch": 1.064, "percentage": 36.67, "elapsed_time": "0:11:07", "remaining_time": "0:19:13"}
|
| 12 |
{"current_steps": 12, "total_steps": 30, "loss": 1.0706, "lr": 7.500000000000001e-06, "epoch": 1.16, "percentage": 40.0, "elapsed_time": "0:12:00", "remaining_time": "0:18:00"}
|
| 13 |
+
{"current_steps": 13, "total_steps": 30, "loss": 1.0189, "lr": 6.980398830195785e-06, "epoch": 1.256, "percentage": 43.33, "elapsed_time": "0:12:51", "remaining_time": "0:16:48"}
|
| 14 |
+
{"current_steps": 14, "total_steps": 30, "loss": 1.028, "lr": 6.434016163555452e-06, "epoch": 1.3519999999999999, "percentage": 46.67, "elapsed_time": "0:13:36", "remaining_time": "0:15:33"}
|
| 15 |
+
{"current_steps": 15, "total_steps": 30, "loss": 0.9001, "lr": 5.8682408883346535e-06, "epoch": 1.448, "percentage": 50.0, "elapsed_time": "0:14:22", "remaining_time": "0:14:22"}
|
| 16 |
+
{"current_steps": 16, "total_steps": 30, "loss": 1.0615, "lr": 5.290724144552379e-06, "epoch": 1.544, "percentage": 53.33, "elapsed_time": "0:15:17", "remaining_time": "0:13:22"}
|
| 17 |
+
{"current_steps": 17, "total_steps": 30, "loss": 0.9473, "lr": 4.7092758554476215e-06, "epoch": 1.6400000000000001, "percentage": 56.67, "elapsed_time": "0:16:10", "remaining_time": "0:12:22"}
|
| 18 |
+
{"current_steps": 18, "total_steps": 30, "loss": 0.9851, "lr": 4.131759111665349e-06, "epoch": 1.736, "percentage": 60.0, "elapsed_time": "0:17:04", "remaining_time": "0:11:23"}
|
| 19 |
+
{"current_steps": 19, "total_steps": 30, "loss": 0.8426, "lr": 3.5659838364445505e-06, "epoch": 1.8319999999999999, "percentage": 63.33, "elapsed_time": "0:17:58", "remaining_time": "0:10:24"}
|
| 20 |
+
{"current_steps": 20, "total_steps": 30, "loss": 1.0051, "lr": 3.019601169804216e-06, "epoch": 1.928, "percentage": 66.67, "elapsed_time": "0:18:57", "remaining_time": "0:09:28"}
|
| 21 |
+
{"current_steps": 21, "total_steps": 30, "loss": 1.6283, "lr": 2.5000000000000015e-06, "epoch": 2.032, "percentage": 70.0, "elapsed_time": "0:21:00", "remaining_time": "0:09:00"}
|
| 22 |
+
{"current_steps": 22, "total_steps": 30, "loss": 0.9316, "lr": 2.0142070414860704e-06, "epoch": 2.128, "percentage": 73.33, "elapsed_time": "0:21:55", "remaining_time": "0:07:58"}
|
| 23 |
+
{"current_steps": 23, "total_steps": 30, "loss": 0.9276, "lr": 1.5687918106563326e-06, "epoch": 2.224, "percentage": 76.67, "elapsed_time": "0:22:49", "remaining_time": "0:06:56"}
|