Training in progress, epoch 3
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:299796797737aca4de803e67643d5532be9f3ba874fe1875484866ef86b36681
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f72f2e6faeaf6018cd769218b5a5f60bad1935aea755f2d4a78491fca46e52c
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:df898a1fbffbfeb29a3358f7b3115a9827f040629140999246923cd11dfe93f9
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3c0c90145429fe23edde76ec70001603bc326d3fc22300d772d758442027dbd
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -35,3 +35,11 @@
|
|
| 35 |
{"current_steps": 35, "total_steps": 117, "loss": 0.3912, "lr": 8.862084796122998e-06, "epoch": 3.6582278481012658, "percentage": 29.91, "elapsed_time": "0:17:07", "remaining_time": "0:40:06"}
|
| 36 |
{"current_steps": 36, "total_steps": 117, "loss": 0.3695, "lr": 8.765357330018056e-06, "epoch": 3.759493670886076, "percentage": 30.77, "elapsed_time": "0:17:28", "remaining_time": "0:39:19"}
|
| 37 |
{"current_steps": 37, "total_steps": 117, "loss": 0.3987, "lr": 8.665259359149132e-06, "epoch": 3.8607594936708862, "percentage": 31.62, "elapsed_time": "0:17:54", "remaining_time": "0:38:42"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 35 |
{"current_steps": 35, "total_steps": 117, "loss": 0.3912, "lr": 8.862084796122998e-06, "epoch": 3.6582278481012658, "percentage": 29.91, "elapsed_time": "0:17:07", "remaining_time": "0:40:06"}
|
| 36 |
{"current_steps": 36, "total_steps": 117, "loss": 0.3695, "lr": 8.765357330018056e-06, "epoch": 3.759493670886076, "percentage": 30.77, "elapsed_time": "0:17:28", "remaining_time": "0:39:19"}
|
| 37 |
{"current_steps": 37, "total_steps": 117, "loss": 0.3987, "lr": 8.665259359149132e-06, "epoch": 3.8607594936708862, "percentage": 31.62, "elapsed_time": "0:17:54", "remaining_time": "0:38:42"}
|
| 38 |
+
{"current_steps": 38, "total_steps": 117, "loss": 0.3722, "lr": 8.561880484756726e-06, "epoch": 3.962025316455696, "percentage": 32.48, "elapsed_time": "0:18:14", "remaining_time": "0:37:54"}
|
| 39 |
+
{"current_steps": 39, "total_steps": 117, "loss": 0.3469, "lr": 8.455313244934324e-06, "epoch": 4.10126582278481, "percentage": 33.33, "elapsed_time": "0:19:41", "remaining_time": "0:39:23"}
|
| 40 |
+
{"current_steps": 40, "total_steps": 117, "loss": 0.3401, "lr": 8.345653031794292e-06, "epoch": 4.2025316455696204, "percentage": 34.19, "elapsed_time": "0:20:15", "remaining_time": "0:39:00"}
|
| 41 |
+
{"current_steps": 41, "total_steps": 117, "loss": 0.367, "lr": 8.232998006078998e-06, "epoch": 4.30379746835443, "percentage": 35.04, "elapsed_time": "0:20:43", "remaining_time": "0:38:24"}
|
| 42 |
+
{"current_steps": 42, "total_steps": 117, "loss": 0.2696, "lr": 8.117449009293668e-06, "epoch": 4.405063291139241, "percentage": 35.9, "elapsed_time": "0:21:05", "remaining_time": "0:37:40"}
|
| 43 |
+
{"current_steps": 43, "total_steps": 117, "loss": 0.3087, "lr": 7.99910947343957e-06, "epoch": 4.506329113924051, "percentage": 36.75, "elapsed_time": "0:21:40", "remaining_time": "0:37:17"}
|
| 44 |
+
{"current_steps": 44, "total_steps": 117, "loss": 0.3239, "lr": 7.87808532842837e-06, "epoch": 4.6075949367088604, "percentage": 37.61, "elapsed_time": "0:22:08", "remaining_time": "0:36:44"}
|
| 45 |
+
{"current_steps": 45, "total_steps": 117, "loss": 0.2656, "lr": 7.754484907260513e-06, "epoch": 4.708860759493671, "percentage": 38.46, "elapsed_time": "0:22:25", "remaining_time": "0:35:52"}
|