Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b6d66cca43133be94c69f4146dc9c245ad933cf084f93889f2b9310d406b4ba3
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:80643cacfffc1eb4481fbd284052629f60af2a517c06dc561440c36f9cbfd5cd
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22c2e6f4673a4e87dcaf42844097ffea2893652947bff088d524e37a00dc9b3f
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c1359cc5fc5e8b89c9ced4edcadc5c628d33288f4a4497a87a9db48ce6707c23
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -17,3 +17,19 @@
|
|
| 17 |
{"current_steps": 17, "total_steps": 45, "loss": 0.8017, "lr": 3.969463130731183e-06, "epoch": 1.096, "percentage": 37.78, "elapsed_time": "0:11:19", "remaining_time": "0:18:39"}
|
| 18 |
{"current_steps": 18, "total_steps": 45, "loss": 0.5691, "lr": 3.806246411789872e-06, "epoch": 1.16, "percentage": 40.0, "elapsed_time": "0:11:58", "remaining_time": "0:17:57"}
|
| 19 |
{"current_steps": 19, "total_steps": 45, "loss": 0.6708, "lr": 3.634976249348867e-06, "epoch": 1.224, "percentage": 42.22, "elapsed_time": "0:12:39", "remaining_time": "0:17:18"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 17 |
{"current_steps": 17, "total_steps": 45, "loss": 0.8017, "lr": 3.969463130731183e-06, "epoch": 1.096, "percentage": 37.78, "elapsed_time": "0:11:19", "remaining_time": "0:18:39"}
|
| 18 |
{"current_steps": 18, "total_steps": 45, "loss": 0.5691, "lr": 3.806246411789872e-06, "epoch": 1.16, "percentage": 40.0, "elapsed_time": "0:11:58", "remaining_time": "0:17:57"}
|
| 19 |
{"current_steps": 19, "total_steps": 45, "loss": 0.6708, "lr": 3.634976249348867e-06, "epoch": 1.224, "percentage": 42.22, "elapsed_time": "0:12:39", "remaining_time": "0:17:18"}
|
| 20 |
+
{"current_steps": 20, "total_steps": 45, "loss": 0.5849, "lr": 3.4567085809127247e-06, "epoch": 1.288, "percentage": 44.44, "elapsed_time": "0:13:13", "remaining_time": "0:16:31"}
|
| 21 |
+
{"current_steps": 21, "total_steps": 45, "loss": 0.6678, "lr": 3.272542485937369e-06, "epoch": 1.3519999999999999, "percentage": 46.67, "elapsed_time": "0:13:52", "remaining_time": "0:15:51"}
|
| 22 |
+
{"current_steps": 22, "total_steps": 45, "loss": 0.6192, "lr": 3.0836134096397642e-06, "epoch": 1.416, "percentage": 48.89, "elapsed_time": "0:14:31", "remaining_time": "0:15:10"}
|
| 23 |
+
{"current_steps": 23, "total_steps": 45, "loss": 0.6421, "lr": 2.8910861626005774e-06, "epoch": 1.48, "percentage": 51.11, "elapsed_time": "0:15:06", "remaining_time": "0:14:26"}
|
| 24 |
+
{"current_steps": 24, "total_steps": 45, "loss": 0.6162, "lr": 2.696147739319613e-06, "epoch": 1.544, "percentage": 53.33, "elapsed_time": "0:15:38", "remaining_time": "0:13:41"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 45, "loss": 0.6482, "lr": 2.5e-06, "epoch": 1.608, "percentage": 55.56, "elapsed_time": "0:16:16", "remaining_time": "0:13:00"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 45, "loss": 0.6589, "lr": 2.3038522606803882e-06, "epoch": 1.6720000000000002, "percentage": 57.78, "elapsed_time": "0:16:48", "remaining_time": "0:12:16"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 45, "loss": 0.5894, "lr": 2.1089138373994226e-06, "epoch": 1.736, "percentage": 60.0, "elapsed_time": "0:17:25", "remaining_time": "0:11:36"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 45, "loss": 0.6103, "lr": 1.9163865903602374e-06, "epoch": 1.8, "percentage": 62.22, "elapsed_time": "0:17:56", "remaining_time": "0:10:53"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 45, "loss": 0.5794, "lr": 1.7274575140626318e-06, "epoch": 1.8639999999999999, "percentage": 64.44, "elapsed_time": "0:18:28", "remaining_time": "0:10:11"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 45, "loss": 0.6615, "lr": 1.5432914190872757e-06, "epoch": 1.928, "percentage": 66.67, "elapsed_time": "0:19:01", "remaining_time": "0:09:30"}
|
| 31 |
+
{"current_steps": 31, "total_steps": 45, "loss": 0.8842, "lr": 1.3650237506511333e-06, "epoch": 1.992, "percentage": 68.89, "elapsed_time": "0:19:36", "remaining_time": "0:08:51"}
|
| 32 |
+
{"current_steps": 32, "total_steps": 45, "loss": 0.6189, "lr": 1.193753588210128e-06, "epoch": 2.064, "percentage": 71.11, "elapsed_time": "0:21:17", "remaining_time": "0:08:38"}
|
| 33 |
+
{"current_steps": 33, "total_steps": 45, "loss": 0.5628, "lr": 1.0305368692688175e-06, "epoch": 2.128, "percentage": 73.33, "elapsed_time": "0:21:45", "remaining_time": "0:07:54"}
|
| 34 |
+
{"current_steps": 34, "total_steps": 45, "loss": 0.5932, "lr": 8.763798791745413e-07, "epoch": 2.192, "percentage": 75.56, "elapsed_time": "0:22:24", "remaining_time": "0:07:14"}
|
| 35 |
+
{"current_steps": 35, "total_steps": 45, "loss": 0.5959, "lr": 7.322330470336314e-07, "epoch": 2.2560000000000002, "percentage": 77.78, "elapsed_time": "0:22:57", "remaining_time": "0:06:33"}
|