Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c6ac77c4d3ab75f4f8398e03d5e24e741271e523be61fc3042c9b0226290a896
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3675e8859016eed41791b18611ce523ea0bf757613a23b7ea3fdbec795695718
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c494d8ddd9efcc931f66c899d653dabac804500be3fa7e93c0d97b56104f5abc
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eef0c1603ed5a89a2c285196187a044c5fe290a1e122820d78289f42edda61c9
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -21,3 +21,11 @@
|
|
| 21 |
{"current_steps": 21, "total_steps": 30, "loss": 1.6283, "lr": 2.5000000000000015e-06, "epoch": 2.032, "percentage": 70.0, "elapsed_time": "0:21:00", "remaining_time": "0:09:00"}
|
| 22 |
{"current_steps": 22, "total_steps": 30, "loss": 0.9316, "lr": 2.0142070414860704e-06, "epoch": 2.128, "percentage": 73.33, "elapsed_time": "0:21:55", "remaining_time": "0:07:58"}
|
| 23 |
{"current_steps": 23, "total_steps": 30, "loss": 0.9276, "lr": 1.5687918106563326e-06, "epoch": 2.224, "percentage": 76.67, "elapsed_time": "0:22:49", "remaining_time": "0:06:56"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 21 |
{"current_steps": 21, "total_steps": 30, "loss": 1.6283, "lr": 2.5000000000000015e-06, "epoch": 2.032, "percentage": 70.0, "elapsed_time": "0:21:00", "remaining_time": "0:09:00"}
|
| 22 |
{"current_steps": 22, "total_steps": 30, "loss": 0.9316, "lr": 2.0142070414860704e-06, "epoch": 2.128, "percentage": 73.33, "elapsed_time": "0:21:55", "remaining_time": "0:07:58"}
|
| 23 |
{"current_steps": 23, "total_steps": 30, "loss": 0.9276, "lr": 1.5687918106563326e-06, "epoch": 2.224, "percentage": 76.67, "elapsed_time": "0:22:49", "remaining_time": "0:06:56"}
|
| 24 |
+
{"current_steps": 24, "total_steps": 30, "loss": 0.8732, "lr": 1.1697777844051105e-06, "epoch": 2.32, "percentage": 80.0, "elapsed_time": "0:23:30", "remaining_time": "0:05:52"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 30, "loss": 0.9338, "lr": 8.225609429353187e-07, "epoch": 2.416, "percentage": 83.33, "elapsed_time": "0:24:23", "remaining_time": "0:04:52"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 30, "loss": 0.908, "lr": 5.318367983829393e-07, "epoch": 2.512, "percentage": 86.67, "elapsed_time": "0:25:22", "remaining_time": "0:03:54"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 30, "loss": 0.9636, "lr": 3.015368960704584e-07, "epoch": 2.608, "percentage": 90.0, "elapsed_time": "0:26:18", "remaining_time": "0:02:55"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 30, "loss": 0.941, "lr": 1.3477564710088097e-07, "epoch": 2.7039999999999997, "percentage": 93.33, "elapsed_time": "0:27:12", "remaining_time": "0:01:56"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 30, "loss": 0.8554, "lr": 3.3808211290284886e-08, "epoch": 2.8, "percentage": 96.67, "elapsed_time": "0:27:58", "remaining_time": "0:00:57"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 30, "loss": 1.0298, "lr": 0.0, "epoch": 2.896, "percentage": 100.0, "elapsed_time": "0:28:53", "remaining_time": "0:00:00"}
|
| 31 |
+
{"current_steps": 30, "total_steps": 30, "epoch": 2.896, "percentage": 100.0, "elapsed_time": "0:31:03", "remaining_time": "0:00:00"}
|