Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:53d3c966305c17c7f3f6dad55e2e51e5289f3a3ec057d741546cc85e08a5ac4e
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db9045b12b522a8f23d5449947caefc7b6dc05234b9d4777a57eb32a2a65a3f2
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce2c88c5166ed563fbabd42db15437680629d31cbc8bf7cfa8b075afa18a83ef
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:68beff2ef6ffc4dbe197341132e7842b8ba33698fcf1e92cc1025e228ae20f8f
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -11,3 +11,13 @@
|
|
| 11 |
{"current_steps": 11, "total_steps": 30, "loss": 1.4602, "lr": 7.985792958513932e-06, "epoch": 1.0476190476190477, "percentage": 36.67, "elapsed_time": "0:06:56", "remaining_time": "0:11:58"}
|
| 12 |
{"current_steps": 12, "total_steps": 30, "loss": 0.9868, "lr": 7.500000000000001e-06, "epoch": 1.1428571428571428, "percentage": 40.0, "elapsed_time": "0:07:29", "remaining_time": "0:11:14"}
|
| 13 |
{"current_steps": 13, "total_steps": 30, "loss": 0.819, "lr": 6.980398830195785e-06, "epoch": 1.2380952380952381, "percentage": 43.33, "elapsed_time": "0:07:56", "remaining_time": "0:10:22"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 11 |
{"current_steps": 11, "total_steps": 30, "loss": 1.4602, "lr": 7.985792958513932e-06, "epoch": 1.0476190476190477, "percentage": 36.67, "elapsed_time": "0:06:56", "remaining_time": "0:11:58"}
|
| 12 |
{"current_steps": 12, "total_steps": 30, "loss": 0.9868, "lr": 7.500000000000001e-06, "epoch": 1.1428571428571428, "percentage": 40.0, "elapsed_time": "0:07:29", "remaining_time": "0:11:14"}
|
| 13 |
{"current_steps": 13, "total_steps": 30, "loss": 0.819, "lr": 6.980398830195785e-06, "epoch": 1.2380952380952381, "percentage": 43.33, "elapsed_time": "0:07:56", "remaining_time": "0:10:22"}
|
| 14 |
+
{"current_steps": 14, "total_steps": 30, "loss": 0.9123, "lr": 6.434016163555452e-06, "epoch": 1.3333333333333333, "percentage": 46.67, "elapsed_time": "0:08:26", "remaining_time": "0:09:38"}
|
| 15 |
+
{"current_steps": 15, "total_steps": 30, "loss": 1.0189, "lr": 5.8682408883346535e-06, "epoch": 1.4285714285714286, "percentage": 50.0, "elapsed_time": "0:09:03", "remaining_time": "0:09:03"}
|
| 16 |
+
{"current_steps": 16, "total_steps": 30, "loss": 0.8441, "lr": 5.290724144552379e-06, "epoch": 1.5238095238095237, "percentage": 53.33, "elapsed_time": "0:09:33", "remaining_time": "0:08:21"}
|
| 17 |
+
{"current_steps": 17, "total_steps": 30, "loss": 0.8394, "lr": 4.7092758554476215e-06, "epoch": 1.619047619047619, "percentage": 56.67, "elapsed_time": "0:10:04", "remaining_time": "0:07:42"}
|
| 18 |
+
{"current_steps": 18, "total_steps": 30, "loss": 0.9112, "lr": 4.131759111665349e-06, "epoch": 1.7142857142857144, "percentage": 60.0, "elapsed_time": "0:10:37", "remaining_time": "0:07:05"}
|
| 19 |
+
{"current_steps": 19, "total_steps": 30, "loss": 0.9243, "lr": 3.5659838364445505e-06, "epoch": 1.8095238095238095, "percentage": 63.33, "elapsed_time": "0:11:10", "remaining_time": "0:06:28"}
|
| 20 |
+
{"current_steps": 20, "total_steps": 30, "loss": 0.9303, "lr": 3.019601169804216e-06, "epoch": 1.9047619047619047, "percentage": 66.67, "elapsed_time": "0:11:35", "remaining_time": "0:05:47"}
|
| 21 |
+
{"current_steps": 21, "total_steps": 30, "loss": 1.2204, "lr": 2.5000000000000015e-06, "epoch": 2.0, "percentage": 70.0, "elapsed_time": "0:12:05", "remaining_time": "0:05:11"}
|
| 22 |
+
{"current_steps": 22, "total_steps": 30, "loss": 0.8433, "lr": 2.0142070414860704e-06, "epoch": 2.0952380952380953, "percentage": 73.33, "elapsed_time": "0:13:31", "remaining_time": "0:04:54"}
|
| 23 |
+
{"current_steps": 23, "total_steps": 30, "loss": 0.853, "lr": 1.5687918106563326e-06, "epoch": 2.1904761904761907, "percentage": 76.67, "elapsed_time": "0:14:04", "remaining_time": "0:04:16"}
|