Training in progress, epoch 9
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f09846cac255d2d4417842251227d40899a159140345de33317322b364010da
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8ec5cdd9441f8aac06835bb512526c8262ee43a484a031aaac59aba12e095a32
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8f232768a6cb60f03a103ffc49f8db2b0a897024cd18b7d6f08b4a74277380b1
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c7d45fd045ab51d3375c74bca507120494838a938362349b8e099936e5e87766
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -84,3 +84,20 @@
|
|
| 84 |
{"current_steps": 84, "total_steps": 117, "loss": 0.2106, "lr": 2.245515092739488e-06, "epoch": 8.810126582278482, "percentage": 71.79, "elapsed_time": "0:41:29", "remaining_time": "0:16:17"}
|
| 85 |
{"current_steps": 85, "total_steps": 117, "loss": 0.151, "lr": 2.1219146715716332e-06, "epoch": 8.91139240506329, "percentage": 72.65, "elapsed_time": "0:41:44", "remaining_time": "0:15:42"}
|
| 86 |
{"current_steps": 86, "total_steps": 117, "loss": 0.1684, "lr": 2.0008905265604316e-06, "epoch": 9.050632911392405, "percentage": 73.5, "elapsed_time": "0:43:08", "remaining_time": "0:15:33"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 84 |
{"current_steps": 84, "total_steps": 117, "loss": 0.2106, "lr": 2.245515092739488e-06, "epoch": 8.810126582278482, "percentage": 71.79, "elapsed_time": "0:41:29", "remaining_time": "0:16:17"}
|
| 85 |
{"current_steps": 85, "total_steps": 117, "loss": 0.151, "lr": 2.1219146715716332e-06, "epoch": 8.91139240506329, "percentage": 72.65, "elapsed_time": "0:41:44", "remaining_time": "0:15:42"}
|
| 86 |
{"current_steps": 86, "total_steps": 117, "loss": 0.1684, "lr": 2.0008905265604316e-06, "epoch": 9.050632911392405, "percentage": 73.5, "elapsed_time": "0:43:08", "remaining_time": "0:15:33"}
|
| 87 |
+
{"current_steps": 87, "total_steps": 117, "loss": 0.1226, "lr": 1.8825509907063328e-06, "epoch": 9.151898734177216, "percentage": 74.36, "elapsed_time": "0:43:31", "remaining_time": "0:15:00"}
|
| 88 |
+
{"current_steps": 88, "total_steps": 117, "loss": 0.1742, "lr": 1.7670019939210025e-06, "epoch": 9.253164556962025, "percentage": 75.21, "elapsed_time": "0:43:59", "remaining_time": "0:14:29"}
|
| 89 |
+
{"current_steps": 89, "total_steps": 117, "loss": 0.1384, "lr": 1.6543469682057105e-06, "epoch": 9.354430379746836, "percentage": 76.07, "elapsed_time": "0:44:23", "remaining_time": "0:13:57"}
|
| 90 |
+
{"current_steps": 90, "total_steps": 117, "loss": 0.1457, "lr": 1.544686755065677e-06, "epoch": 9.455696202531646, "percentage": 76.92, "elapsed_time": "0:44:45", "remaining_time": "0:13:25"}
|
| 91 |
+
{"current_steps": 91, "total_steps": 117, "loss": 0.1634, "lr": 1.438119515243277e-06, "epoch": 9.556962025316455, "percentage": 77.78, "elapsed_time": "0:45:05", "remaining_time": "0:12:52"}
|
| 92 |
+
{"current_steps": 92, "total_steps": 117, "loss": 0.1603, "lr": 1.3347406408508695e-06, "epoch": 9.658227848101266, "percentage": 78.63, "elapsed_time": "0:45:27", "remaining_time": "0:12:21"}
|
| 93 |
+
{"current_steps": 93, "total_steps": 117, "loss": 0.1641, "lr": 1.234642669981946e-06, "epoch": 9.759493670886076, "percentage": 79.49, "elapsed_time": "0:45:52", "remaining_time": "0:11:50"}
|
| 94 |
+
{"current_steps": 94, "total_steps": 117, "loss": 0.2185, "lr": 1.137915203877003e-06, "epoch": 9.860759493670885, "percentage": 80.34, "elapsed_time": "0:46:25", "remaining_time": "0:11:21"}
|
| 95 |
+
{"current_steps": 95, "total_steps": 117, "loss": 0.131, "lr": 1.044644826718295e-06, "epoch": 9.962025316455696, "percentage": 81.2, "elapsed_time": "0:46:48", "remaining_time": "0:10:50"}
|
| 96 |
+
{"current_steps": 96, "total_steps": 117, "loss": 0.1025, "lr": 9.549150281252633e-07, "epoch": 10.10126582278481, "percentage": 82.05, "elapsed_time": "0:48:05", "remaining_time": "0:10:31"}
|
| 97 |
+
{"current_steps": 97, "total_steps": 117, "loss": 0.1279, "lr": 8.688061284200266e-07, "epoch": 10.20253164556962, "percentage": 82.91, "elapsed_time": "0:48:26", "remaining_time": "0:09:59"}
|
| 98 |
+
{"current_steps": 98, "total_steps": 117, "loss": 0.1781, "lr": 7.863952067298042e-07, "epoch": 10.30379746835443, "percentage": 83.76, "elapsed_time": "0:48:58", "remaining_time": "0:09:29"}
|
| 99 |
+
{"current_steps": 99, "total_steps": 117, "loss": 0.1564, "lr": 7.077560319906696e-07, "epoch": 10.405063291139241, "percentage": 84.62, "elapsed_time": "0:49:29", "remaining_time": "0:08:59"}
|
| 100 |
+
{"current_steps": 100, "total_steps": 117, "loss": 0.1901, "lr": 6.329589969143518e-07, "epoch": 10.50632911392405, "percentage": 85.47, "elapsed_time": "0:49:55", "remaining_time": "0:08:29"}
|
| 101 |
+
{"current_steps": 101, "total_steps": 117, "loss": 0.1512, "lr": 5.620710549772295e-07, "epoch": 10.60759493670886, "percentage": 86.32, "elapsed_time": "0:50:19", "remaining_time": "0:07:58"}
|
| 102 |
+
{"current_steps": 102, "total_steps": 117, "loss": 0.1403, "lr": 4.951556604879049e-07, "epoch": 10.708860759493671, "percentage": 87.18, "elapsed_time": "0:50:42", "remaining_time": "0:07:27"}
|
| 103 |
+
{"current_steps": 103, "total_steps": 117, "loss": 0.1152, "lr": 4.322727117869951e-07, "epoch": 10.810126582278482, "percentage": 88.03, "elapsed_time": "0:51:05", "remaining_time": "0:06:56"}
|