Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:706b526132446956b812baadfb971a64b2774ec4f41e7b6a8348d9723785a8a5
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c14096fb3eaca7d4811802305de5b406645987abb8bb04d7a4063448109eb1c9
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2409d2000becd09909a0865a8e034f31c1fa62a791b9a7ef1cedf501a1327b16
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dd62595cbee2360bf20a2a8798b939257493de1f088a33967ca2a499fa454ba7
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -186,3 +186,32 @@
|
|
| 186 |
{"current_steps": 186, "total_steps": 216, "loss": 0.2161, "lr": 5.785225463498828e-07, "epoch": 2.571428571428571, "percentage": 86.11, "elapsed_time": "0:12:57", "remaining_time": "0:02:05"}
|
| 187 |
{"current_steps": 187, "total_steps": 216, "loss": 0.249, "lr": 5.412973117089288e-07, "epoch": 2.5852534562211984, "percentage": 86.57, "elapsed_time": "0:13:00", "remaining_time": "0:02:01"}
|
| 188 |
{"current_steps": 188, "total_steps": 216, "loss": 0.1794, "lr": 5.05241294573024e-07, "epoch": 2.5990783410138247, "percentage": 87.04, "elapsed_time": "0:13:03", "remaining_time": "0:01:56"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 186 |
{"current_steps": 186, "total_steps": 216, "loss": 0.2161, "lr": 5.785225463498828e-07, "epoch": 2.571428571428571, "percentage": 86.11, "elapsed_time": "0:12:57", "remaining_time": "0:02:05"}
|
| 187 |
{"current_steps": 187, "total_steps": 216, "loss": 0.249, "lr": 5.412973117089288e-07, "epoch": 2.5852534562211984, "percentage": 86.57, "elapsed_time": "0:13:00", "remaining_time": "0:02:01"}
|
| 188 |
{"current_steps": 188, "total_steps": 216, "loss": 0.1794, "lr": 5.05241294573024e-07, "epoch": 2.5990783410138247, "percentage": 87.04, "elapsed_time": "0:13:03", "remaining_time": "0:01:56"}
|
| 189 |
+
{"current_steps": 189, "total_steps": 216, "loss": 0.2483, "lr": 4.7036395000776556e-07, "epoch": 2.6129032258064515, "percentage": 87.5, "elapsed_time": "0:13:07", "remaining_time": "0:01:52"}
|
| 190 |
+
{"current_steps": 190, "total_steps": 216, "loss": 0.1891, "lr": 4.3667442399229985e-07, "epoch": 2.6267281105990783, "percentage": 87.96, "elapsed_time": "0:13:10", "remaining_time": "0:01:48"}
|
| 191 |
+
{"current_steps": 191, "total_steps": 216, "loss": 0.2294, "lr": 4.041815510209396e-07, "epoch": 2.640552995391705, "percentage": 88.43, "elapsed_time": "0:13:14", "remaining_time": "0:01:43"}
|
| 192 |
+
{"current_steps": 192, "total_steps": 216, "loss": 0.2278, "lr": 3.728938517864794e-07, "epoch": 2.654377880184332, "percentage": 88.89, "elapsed_time": "0:13:17", "remaining_time": "0:01:39"}
|
| 193 |
+
{"current_steps": 193, "total_steps": 216, "loss": 0.2144, "lr": 3.4281953094578877e-07, "epoch": 2.6682027649769586, "percentage": 89.35, "elapsed_time": "0:13:20", "remaining_time": "0:01:35"}
|
| 194 |
+
{"current_steps": 194, "total_steps": 216, "loss": 0.2517, "lr": 3.1396647496828245e-07, "epoch": 2.6820276497695854, "percentage": 89.81, "elapsed_time": "0:13:24", "remaining_time": "0:01:31"}
|
| 195 |
+
{"current_steps": 195, "total_steps": 216, "loss": 0.2611, "lr": 2.8634225006782867e-07, "epoch": 2.6958525345622117, "percentage": 90.28, "elapsed_time": "0:13:27", "remaining_time": "0:01:26"}
|
| 196 |
+
{"current_steps": 196, "total_steps": 216, "loss": 0.2059, "lr": 2.599541002186479e-07, "epoch": 2.709677419354839, "percentage": 90.74, "elapsed_time": "0:13:30", "remaining_time": "0:01:22"}
|
| 197 |
+
{"current_steps": 197, "total_steps": 216, "loss": 0.1805, "lr": 2.3480894525569564e-07, "epoch": 2.7235023041474653, "percentage": 91.2, "elapsed_time": "0:13:34", "remaining_time": "0:01:18"}
|
| 198 |
+
{"current_steps": 198, "total_steps": 216, "loss": 0.2479, "lr": 2.109133790600648e-07, "epoch": 2.737327188940092, "percentage": 91.67, "elapsed_time": "0:13:37", "remaining_time": "0:01:14"}
|
| 199 |
+
{"current_steps": 199, "total_steps": 216, "loss": 0.2388, "lr": 1.8827366782984913e-07, "epoch": 2.751152073732719, "percentage": 92.13, "elapsed_time": "0:13:41", "remaining_time": "0:01:10"}
|
| 200 |
+
{"current_steps": 200, "total_steps": 216, "loss": 0.2238, "lr": 1.6689574843694433e-07, "epoch": 2.7649769585253456, "percentage": 92.59, "elapsed_time": "0:13:44", "remaining_time": "0:01:05"}
|
| 201 |
+
{"current_steps": 201, "total_steps": 216, "loss": 0.1927, "lr": 1.4678522687020414e-07, "epoch": 2.7788018433179724, "percentage": 93.06, "elapsed_time": "0:13:47", "remaining_time": "0:01:01"}
|
| 202 |
+
{"current_steps": 202, "total_steps": 216, "loss": 0.219, "lr": 1.2794737676536993e-07, "epoch": 2.792626728110599, "percentage": 93.52, "elapsed_time": "0:13:51", "remaining_time": "0:00:57"}
|
| 203 |
+
{"current_steps": 203, "total_steps": 216, "loss": 0.2258, "lr": 1.1038713802214718e-07, "epoch": 2.806451612903226, "percentage": 93.98, "elapsed_time": "0:13:54", "remaining_time": "0:00:53"}
|
| 204 |
+
{"current_steps": 204, "total_steps": 216, "loss": 0.2272, "lr": 9.410911550880474e-08, "epoch": 2.8202764976958523, "percentage": 94.44, "elapsed_time": "0:13:58", "remaining_time": "0:00:49"}
|
| 205 |
+
{"current_steps": 205, "total_steps": 216, "loss": 0.1845, "lr": 7.911757785462882e-08, "epoch": 2.8341013824884795, "percentage": 94.91, "elapsed_time": "0:14:01", "remaining_time": "0:00:45"}
|
| 206 |
+
{"current_steps": 206, "total_steps": 216, "loss": 0.1772, "lr": 6.54164563305465e-08, "epoch": 2.847926267281106, "percentage": 95.37, "elapsed_time": "0:14:04", "remaining_time": "0:00:41"}
|
| 207 |
+
{"current_steps": 207, "total_steps": 216, "loss": 0.2429, "lr": 5.3009343818219985e-08, "epoch": 2.8617511520737327, "percentage": 95.83, "elapsed_time": "0:14:08", "remaining_time": "0:00:36"}
|
| 208 |
+
{"current_steps": 208, "total_steps": 216, "loss": 0.2, "lr": 4.189949386787462e-08, "epoch": 2.8755760368663594, "percentage": 96.3, "elapsed_time": "0:14:11", "remaining_time": "0:00:32"}
|
| 209 |
+
{"current_steps": 209, "total_steps": 216, "loss": 0.2812, "lr": 3.2089819845111946e-08, "epoch": 2.889400921658986, "percentage": 96.76, "elapsed_time": "0:14:15", "remaining_time": "0:00:28"}
|
| 210 |
+
{"current_steps": 210, "total_steps": 216, "loss": 0.2579, "lr": 2.358289416693027e-08, "epoch": 2.903225806451613, "percentage": 97.22, "elapsed_time": "0:14:18", "remaining_time": "0:00:24"}
|
| 211 |
+
{"current_steps": 211, "total_steps": 216, "loss": 0.2217, "lr": 1.6380947627153143e-08, "epoch": 2.9170506912442398, "percentage": 97.69, "elapsed_time": "0:14:22", "remaining_time": "0:00:20"}
|
| 212 |
+
{"current_steps": 212, "total_steps": 216, "loss": 0.2273, "lr": 1.0485868811441757e-08, "epoch": 2.9308755760368665, "percentage": 98.15, "elapsed_time": "0:14:25", "remaining_time": "0:00:16"}
|
| 213 |
+
{"current_steps": 213, "total_steps": 216, "loss": 0.2158, "lr": 5.899203602046655e-09, "epoch": 2.944700460829493, "percentage": 98.61, "elapsed_time": "0:14:28", "remaining_time": "0:00:12"}
|
| 214 |
+
{"current_steps": 214, "total_steps": 216, "loss": 0.2063, "lr": 2.6221547724253337e-09, "epoch": 2.9585253456221197, "percentage": 99.07, "elapsed_time": "0:14:32", "remaining_time": "0:00:08"}
|
| 215 |
+
{"current_steps": 215, "total_steps": 216, "loss": 0.2588, "lr": 6.555816718389896e-10, "epoch": 2.9723502304147464, "percentage": 99.54, "elapsed_time": "0:14:35", "remaining_time": "0:00:04"}
|
| 216 |
+
{"current_steps": 216, "total_steps": 216, "loss": 0.2179, "lr": 0.0, "epoch": 2.986175115207373, "percentage": 100.0, "elapsed_time": "0:14:38", "remaining_time": "0:00:00"}
|
| 217 |
+
{"current_steps": 216, "total_steps": 216, "epoch": 2.986175115207373, "percentage": 100.0, "elapsed_time": "0:16:46", "remaining_time": "0:00:00"}
|