Training in progress, epoch 6
Browse files- model-00001-of-00014.safetensors +1 -1
- model-00002-of-00014.safetensors +1 -1
- model-00003-of-00014.safetensors +1 -1
- model-00004-of-00014.safetensors +1 -1
- model-00005-of-00014.safetensors +1 -1
- model-00006-of-00014.safetensors +1 -1
- model-00007-of-00014.safetensors +1 -1
- model-00008-of-00014.safetensors +1 -1
- model-00009-of-00014.safetensors +1 -1
- model-00010-of-00014.safetensors +1 -1
- model-00011-of-00014.safetensors +1 -1
- model-00012-of-00014.safetensors +1 -1
- model-00013-of-00014.safetensors +1 -1
- model-00014-of-00014.safetensors +1 -1
- trainer_log.jsonl +33 -0
model-00001-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4891730992
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6983b72ecb9b04291bce88c65a479d79146bda8b0e9280bb123e7efac84ccc74
|
| 3 |
size 4891730992
|
model-00002-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059352
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b0c04bab2cc961616388bba9d7b0cfbc3f8c54cf2a87a8199334dab5db61f5d1
|
| 3 |
size 4876059352
|
model-00003-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059384
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e5776fa11cca967db0b68169b5c7ffcda4bf29a19f0e30507dfb05a1a0404bb3
|
| 3 |
size 4876059384
|
model-00004-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45ebad2bf3d19dea4415a9bc30ef63cf32aaf52296418d4019ef1d9babc84bc2
|
| 3 |
size 4876059416
|
model-00005-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:69c9eb54fc15da074f844554cdbd143d2a287674a8fe4e9c45675ecd27f7a524
|
| 3 |
size 4876059416
|
model-00006-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c2ce45bb129077aa62aa9c2406003a59ce969ce2b0c5dd0e35dd7b475d05123c
|
| 3 |
size 4876059416
|
model-00007-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3d914ec6e57fca11a3b72fdf7e0f832d98ea118bf6ec6374e7e38520c8dfb02
|
| 3 |
size 4876059416
|
model-00008-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:144ec8cc7e619c97a9d84469d46ba5018e7151990cb58d7617bf2f208f2d1e34
|
| 3 |
size 4876059416
|
model-00009-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9188b3d71f13d8f52dffdbde92a2841cf381709903bca31464cff98a914fd050
|
| 3 |
size 4876059416
|
model-00010-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:94bdbb03f87554270723a6bdead26daa2da4d134316f2cbe0f58fd27744f297d
|
| 3 |
size 4876059416
|
model-00011-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38ca40c936a55918e34f10bfef754fd5f07972125f55b248e1ae38fb6048ba2a
|
| 3 |
size 4876059416
|
model-00012-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8d3978076d3c71284ae7af0a513b32e67db75e8964cd5fe9573484761539aba5
|
| 3 |
size 4876059416
|
model-00013-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4876059416
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b149c19b1abf402b2abf4b3de425add01d7f6929b97c34931d8504293d2a673c
|
| 3 |
size 4876059416
|
model-00014-of-00014.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2123397800
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3f4302cd6003e4558fbdc49357ff2e18d22b6e1cc0dc6e3db127362022f8b79
|
| 3 |
size 2123397800
|
trainer_log.jsonl
CHANGED
|
@@ -175,3 +175,36 @@
|
|
| 175 |
{"current_steps": 175, "total_steps": 231, "loss": 0.1467, "lr": 3.399413251016359e-06, "epoch": 5.303030303030303, "percentage": 75.76, "elapsed_time": "3:26:32", "remaining_time": "1:06:05"}
|
| 176 |
{"current_steps": 176, "total_steps": 231, "loss": 0.1491, "lr": 3.2861677105440335e-06, "epoch": 5.333333333333333, "percentage": 76.19, "elapsed_time": "3:27:34", "remaining_time": "1:04:52"}
|
| 177 |
{"current_steps": 177, "total_steps": 231, "loss": 0.1164, "lr": 3.174468567813461e-06, "epoch": 5.363636363636363, "percentage": 76.62, "elapsed_time": "3:28:21", "remaining_time": "1:03:34"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 175 |
{"current_steps": 175, "total_steps": 231, "loss": 0.1467, "lr": 3.399413251016359e-06, "epoch": 5.303030303030303, "percentage": 75.76, "elapsed_time": "3:26:32", "remaining_time": "1:06:05"}
|
| 176 |
{"current_steps": 176, "total_steps": 231, "loss": 0.1491, "lr": 3.2861677105440335e-06, "epoch": 5.333333333333333, "percentage": 76.19, "elapsed_time": "3:27:34", "remaining_time": "1:04:52"}
|
| 177 |
{"current_steps": 177, "total_steps": 231, "loss": 0.1164, "lr": 3.174468567813461e-06, "epoch": 5.363636363636363, "percentage": 76.62, "elapsed_time": "3:28:21", "remaining_time": "1:03:34"}
|
| 178 |
+
{"current_steps": 178, "total_steps": 231, "loss": 0.1563, "lr": 3.0643415505006733e-06, "epoch": 5.393939393939394, "percentage": 77.06, "elapsed_time": "3:29:24", "remaining_time": "1:02:21"}
|
| 179 |
+
{"current_steps": 179, "total_steps": 231, "loss": 0.1107, "lr": 2.9558120241738786e-06, "epoch": 5.424242424242424, "percentage": 77.49, "elapsed_time": "3:30:08", "remaining_time": "1:01:02"}
|
| 180 |
+
{"current_steps": 180, "total_steps": 231, "loss": 0.1336, "lr": 2.8489049864510053e-06, "epoch": 5.454545454545454, "percentage": 77.92, "elapsed_time": "3:30:55", "remaining_time": "0:59:45"}
|
| 181 |
+
{"current_steps": 181, "total_steps": 231, "loss": 0.138, "lr": 2.7436450612420098e-06, "epoch": 5.484848484848484, "percentage": 78.35, "elapsed_time": "3:31:35", "remaining_time": "0:58:26"}
|
| 182 |
+
{"current_steps": 182, "total_steps": 231, "loss": 0.0933, "lr": 2.640056493077231e-06, "epoch": 5.515151515151516, "percentage": 78.79, "elapsed_time": "3:32:22", "remaining_time": "0:57:10"}
|
| 183 |
+
{"current_steps": 183, "total_steps": 231, "loss": 0.1347, "lr": 2.5381631415231455e-06, "epoch": 5.545454545454545, "percentage": 79.22, "elapsed_time": "3:33:16", "remaining_time": "0:55:56"}
|
| 184 |
+
{"current_steps": 184, "total_steps": 231, "loss": 0.153, "lr": 2.4379884756868167e-06, "epoch": 5.575757575757576, "percentage": 79.65, "elapsed_time": "3:34:15", "remaining_time": "0:54:43"}
|
| 185 |
+
{"current_steps": 185, "total_steps": 231, "loss": 0.1217, "lr": 2.339555568810221e-06, "epoch": 5.606060606060606, "percentage": 80.09, "elapsed_time": "3:35:04", "remaining_time": "0:53:28"}
|
| 186 |
+
{"current_steps": 186, "total_steps": 231, "loss": 0.1502, "lr": 2.2428870929558012e-06, "epoch": 5.636363636363637, "percentage": 80.52, "elapsed_time": "3:35:58", "remaining_time": "0:52:15"}
|
| 187 |
+
{"current_steps": 187, "total_steps": 231, "loss": 0.1189, "lr": 2.1480053137844115e-06, "epoch": 5.666666666666667, "percentage": 80.95, "elapsed_time": "3:36:47", "remaining_time": "0:51:00"}
|
| 188 |
+
{"current_steps": 188, "total_steps": 231, "loss": 0.1429, "lr": 2.054932085426856e-06, "epoch": 5.696969696969697, "percentage": 81.39, "elapsed_time": "3:37:45", "remaining_time": "0:49:48"}
|
| 189 |
+
{"current_steps": 189, "total_steps": 231, "loss": 0.1544, "lr": 1.963688845450218e-06, "epoch": 5.7272727272727275, "percentage": 81.82, "elapsed_time": "3:38:32", "remaining_time": "0:48:33"}
|
| 190 |
+
{"current_steps": 190, "total_steps": 231, "loss": 0.1367, "lr": 1.8742966099201699e-06, "epoch": 5.757575757575758, "percentage": 82.25, "elapsed_time": "3:39:18", "remaining_time": "0:47:19"}
|
| 191 |
+
{"current_steps": 191, "total_steps": 231, "loss": 0.1354, "lr": 1.7867759685603115e-06, "epoch": 5.787878787878788, "percentage": 82.68, "elapsed_time": "3:40:00", "remaining_time": "0:46:04"}
|
| 192 |
+
{"current_steps": 192, "total_steps": 231, "loss": 0.1224, "lr": 1.7011470800097496e-06, "epoch": 5.818181818181818, "percentage": 83.12, "elapsed_time": "3:40:55", "remaining_time": "0:44:52"}
|
| 193 |
+
{"current_steps": 193, "total_steps": 231, "loss": 0.1268, "lr": 1.6174296671799571e-06, "epoch": 5.848484848484849, "percentage": 83.55, "elapsed_time": "3:41:29", "remaining_time": "0:43:36"}
|
| 194 |
+
{"current_steps": 194, "total_steps": 231, "loss": 0.1203, "lr": 1.5356430127119915e-06, "epoch": 5.878787878787879, "percentage": 83.98, "elapsed_time": "3:42:23", "remaining_time": "0:42:24"}
|
| 195 |
+
{"current_steps": 195, "total_steps": 231, "loss": 0.1219, "lr": 1.4558059545351144e-06, "epoch": 5.909090909090909, "percentage": 84.42, "elapsed_time": "3:43:09", "remaining_time": "0:41:11"}
|
| 196 |
+
{"current_steps": 196, "total_steps": 231, "loss": 0.1541, "lr": 1.3779368815278648e-06, "epoch": 5.9393939393939394, "percentage": 84.85, "elapsed_time": "3:44:09", "remaining_time": "0:40:01"}
|
| 197 |
+
{"current_steps": 197, "total_steps": 231, "loss": 0.1178, "lr": 1.302053729282533e-06, "epoch": 5.96969696969697, "percentage": 85.28, "elapsed_time": "3:44:52", "remaining_time": "0:38:48"}
|
| 198 |
+
{"current_steps": 198, "total_steps": 231, "loss": 0.1397, "lr": 1.2281739759740575e-06, "epoch": 6.0, "percentage": 85.71, "elapsed_time": "3:45:46", "remaining_time": "0:37:37"}
|
| 199 |
+
{"current_steps": 199, "total_steps": 231, "loss": 0.1333, "lr": 1.156314638334277e-06, "epoch": 6.03030303030303, "percentage": 86.15, "elapsed_time": "3:58:01", "remaining_time": "0:38:16"}
|
| 200 |
+
{"current_steps": 200, "total_steps": 231, "loss": 0.1451, "lr": 1.086492267732462e-06, "epoch": 6.0606060606060606, "percentage": 86.58, "elapsed_time": "3:58:56", "remaining_time": "0:37:02"}
|
| 201 |
+
{"current_steps": 201, "total_steps": 231, "loss": 0.1046, "lr": 1.01872294636304e-06, "epoch": 6.090909090909091, "percentage": 87.01, "elapsed_time": "3:59:45", "remaining_time": "0:35:47"}
|
| 202 |
+
{"current_steps": 202, "total_steps": 231, "loss": 0.1017, "lr": 9.530222835413739e-07, "epoch": 6.121212121212121, "percentage": 87.45, "elapsed_time": "4:00:25", "remaining_time": "0:34:30"}
|
| 203 |
+
{"current_steps": 203, "total_steps": 231, "loss": 0.1278, "lr": 8.894054121084839e-07, "epoch": 6.151515151515151, "percentage": 87.88, "elapsed_time": "4:01:16", "remaining_time": "0:33:16"}
|
| 204 |
+
{"current_steps": 204, "total_steps": 231, "loss": 0.1403, "lr": 8.278869849454718e-07, "epoch": 6.181818181818182, "percentage": 88.31, "elapsed_time": "4:02:14", "remaining_time": "0:32:03"}
|
| 205 |
+
{"current_steps": 205, "total_steps": 231, "loss": 0.1222, "lr": 7.684811715985429e-07, "epoch": 6.212121212121212, "percentage": 88.74, "elapsed_time": "4:03:14", "remaining_time": "0:30:50"}
|
| 206 |
+
{"current_steps": 206, "total_steps": 231, "loss": 0.1313, "lr": 7.1120165501533e-07, "epoch": 6.242424242424242, "percentage": 89.18, "elapsed_time": "4:04:04", "remaining_time": "0:29:37"}
|
| 207 |
+
{"current_steps": 207, "total_steps": 231, "loss": 0.1291, "lr": 6.560616283932897e-07, "epoch": 6.2727272727272725, "percentage": 89.61, "elapsed_time": "4:05:02", "remaining_time": "0:28:24"}
|
| 208 |
+
{"current_steps": 208, "total_steps": 231, "loss": 0.1534, "lr": 6.030737921409169e-07, "epoch": 6.303030303030303, "percentage": 90.04, "elapsed_time": "4:05:54", "remaining_time": "0:27:11"}
|
| 209 |
+
{"current_steps": 209, "total_steps": 231, "loss": 0.0873, "lr": 5.522503509524591e-07, "epoch": 6.333333333333333, "percentage": 90.48, "elapsed_time": "4:06:48", "remaining_time": "0:25:58"}
|
| 210 |
+
{"current_steps": 210, "total_steps": 231, "loss": 0.1134, "lr": 5.036030109968082e-07, "epoch": 6.363636363636363, "percentage": 90.91, "elapsed_time": "4:07:42", "remaining_time": "0:24:46"}
|