neginr commited on
Commit
0cde6c8
·
verified ·
1 Parent(s): f20b62b

Training in progress, epoch 6

Browse files
model-00001-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b750e152ec4f97d177dfb1f7ce9860180942bed9b41d68b034a5cda9d706aaa8
3
  size 4891730992
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6983b72ecb9b04291bce88c65a479d79146bda8b0e9280bb123e7efac84ccc74
3
  size 4891730992
model-00002-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1b081b5eca9af769d59a53110f04455733a84ec7bbbb52a75ded49bd10b26e58
3
  size 4876059352
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0c04bab2cc961616388bba9d7b0cfbc3f8c54cf2a87a8199334dab5db61f5d1
3
  size 4876059352
model-00003-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6399dc4a2b115eccb1275a9e90a0094a6a9d3c341dad1a48d522cba1d61a2d58
3
  size 4876059384
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5776fa11cca967db0b68169b5c7ffcda4bf29a19f0e30507dfb05a1a0404bb3
3
  size 4876059384
model-00004-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e2d9cef2bf8fc73d42354ea7b879c6bd40acb3d72bad2759b78bdb9d57332b94
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45ebad2bf3d19dea4415a9bc30ef63cf32aaf52296418d4019ef1d9babc84bc2
3
  size 4876059416
model-00005-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c249729690c7dcba7889503cf5857c00ad6f5d199078d793a0afe5207c400c74
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69c9eb54fc15da074f844554cdbd143d2a287674a8fe4e9c45675ecd27f7a524
3
  size 4876059416
model-00006-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94837d858e92d9ead6fe2dfc36d4f7b170f51f151e96b6ec79f85bc1a8d7391d
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2ce45bb129077aa62aa9c2406003a59ce969ce2b0c5dd0e35dd7b475d05123c
3
  size 4876059416
model-00007-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b0221bdea8a3deac23a20caa9504f982ab315e28632cf683f65350092ce5d488
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3d914ec6e57fca11a3b72fdf7e0f832d98ea118bf6ec6374e7e38520c8dfb02
3
  size 4876059416
model-00008-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f8a83482e46fd5be75ff6ec520226a8d3a0d2f706f40992f5db6d3374a98baf
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:144ec8cc7e619c97a9d84469d46ba5018e7151990cb58d7617bf2f208f2d1e34
3
  size 4876059416
model-00009-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:881f64a12809f1df8d49824a9992c41d1d66105b254bb40d64f3c51475226244
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9188b3d71f13d8f52dffdbde92a2841cf381709903bca31464cff98a914fd050
3
  size 4876059416
model-00010-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bbe63b6969e9fe6464188af051faa86b28326e59b18cf8c98c8bd7990e0e089a
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:94bdbb03f87554270723a6bdead26daa2da4d134316f2cbe0f58fd27744f297d
3
  size 4876059416
model-00011-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:51c97af867cb1c4b38f8ca5f98d0b0a0b31da7c086a8f9e2e57d4a0d939b7087
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:38ca40c936a55918e34f10bfef754fd5f07972125f55b248e1ae38fb6048ba2a
3
  size 4876059416
model-00012-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d5364fbd822dc35ddaffb54b37523a8df9b7d4342179fd3f652e363936da3ee
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d3978076d3c71284ae7af0a513b32e67db75e8964cd5fe9573484761539aba5
3
  size 4876059416
model-00013-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:797767b2aef5733a94722f090e24b859f8d7f92e31ecb0bac55cad81f7fed2b7
3
  size 4876059416
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b149c19b1abf402b2abf4b3de425add01d7f6929b97c34931d8504293d2a673c
3
  size 4876059416
model-00014-of-00014.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d91748903a27c7eb34bbf21fc71d8bb87a749decd99dd58f709be69b25e77435
3
  size 2123397800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d3f4302cd6003e4558fbdc49357ff2e18d22b6e1cc0dc6e3db127362022f8b79
3
  size 2123397800
trainer_log.jsonl CHANGED
@@ -175,3 +175,36 @@
175
  {"current_steps": 175, "total_steps": 231, "loss": 0.1467, "lr": 3.399413251016359e-06, "epoch": 5.303030303030303, "percentage": 75.76, "elapsed_time": "3:26:32", "remaining_time": "1:06:05"}
176
  {"current_steps": 176, "total_steps": 231, "loss": 0.1491, "lr": 3.2861677105440335e-06, "epoch": 5.333333333333333, "percentage": 76.19, "elapsed_time": "3:27:34", "remaining_time": "1:04:52"}
177
  {"current_steps": 177, "total_steps": 231, "loss": 0.1164, "lr": 3.174468567813461e-06, "epoch": 5.363636363636363, "percentage": 76.62, "elapsed_time": "3:28:21", "remaining_time": "1:03:34"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
175
  {"current_steps": 175, "total_steps": 231, "loss": 0.1467, "lr": 3.399413251016359e-06, "epoch": 5.303030303030303, "percentage": 75.76, "elapsed_time": "3:26:32", "remaining_time": "1:06:05"}
176
  {"current_steps": 176, "total_steps": 231, "loss": 0.1491, "lr": 3.2861677105440335e-06, "epoch": 5.333333333333333, "percentage": 76.19, "elapsed_time": "3:27:34", "remaining_time": "1:04:52"}
177
  {"current_steps": 177, "total_steps": 231, "loss": 0.1164, "lr": 3.174468567813461e-06, "epoch": 5.363636363636363, "percentage": 76.62, "elapsed_time": "3:28:21", "remaining_time": "1:03:34"}
178
+ {"current_steps": 178, "total_steps": 231, "loss": 0.1563, "lr": 3.0643415505006733e-06, "epoch": 5.393939393939394, "percentage": 77.06, "elapsed_time": "3:29:24", "remaining_time": "1:02:21"}
179
+ {"current_steps": 179, "total_steps": 231, "loss": 0.1107, "lr": 2.9558120241738786e-06, "epoch": 5.424242424242424, "percentage": 77.49, "elapsed_time": "3:30:08", "remaining_time": "1:01:02"}
180
+ {"current_steps": 180, "total_steps": 231, "loss": 0.1336, "lr": 2.8489049864510053e-06, "epoch": 5.454545454545454, "percentage": 77.92, "elapsed_time": "3:30:55", "remaining_time": "0:59:45"}
181
+ {"current_steps": 181, "total_steps": 231, "loss": 0.138, "lr": 2.7436450612420098e-06, "epoch": 5.484848484848484, "percentage": 78.35, "elapsed_time": "3:31:35", "remaining_time": "0:58:26"}
182
+ {"current_steps": 182, "total_steps": 231, "loss": 0.0933, "lr": 2.640056493077231e-06, "epoch": 5.515151515151516, "percentage": 78.79, "elapsed_time": "3:32:22", "remaining_time": "0:57:10"}
183
+ {"current_steps": 183, "total_steps": 231, "loss": 0.1347, "lr": 2.5381631415231455e-06, "epoch": 5.545454545454545, "percentage": 79.22, "elapsed_time": "3:33:16", "remaining_time": "0:55:56"}
184
+ {"current_steps": 184, "total_steps": 231, "loss": 0.153, "lr": 2.4379884756868167e-06, "epoch": 5.575757575757576, "percentage": 79.65, "elapsed_time": "3:34:15", "remaining_time": "0:54:43"}
185
+ {"current_steps": 185, "total_steps": 231, "loss": 0.1217, "lr": 2.339555568810221e-06, "epoch": 5.606060606060606, "percentage": 80.09, "elapsed_time": "3:35:04", "remaining_time": "0:53:28"}
186
+ {"current_steps": 186, "total_steps": 231, "loss": 0.1502, "lr": 2.2428870929558012e-06, "epoch": 5.636363636363637, "percentage": 80.52, "elapsed_time": "3:35:58", "remaining_time": "0:52:15"}
187
+ {"current_steps": 187, "total_steps": 231, "loss": 0.1189, "lr": 2.1480053137844115e-06, "epoch": 5.666666666666667, "percentage": 80.95, "elapsed_time": "3:36:47", "remaining_time": "0:51:00"}
188
+ {"current_steps": 188, "total_steps": 231, "loss": 0.1429, "lr": 2.054932085426856e-06, "epoch": 5.696969696969697, "percentage": 81.39, "elapsed_time": "3:37:45", "remaining_time": "0:49:48"}
189
+ {"current_steps": 189, "total_steps": 231, "loss": 0.1544, "lr": 1.963688845450218e-06, "epoch": 5.7272727272727275, "percentage": 81.82, "elapsed_time": "3:38:32", "remaining_time": "0:48:33"}
190
+ {"current_steps": 190, "total_steps": 231, "loss": 0.1367, "lr": 1.8742966099201699e-06, "epoch": 5.757575757575758, "percentage": 82.25, "elapsed_time": "3:39:18", "remaining_time": "0:47:19"}
191
+ {"current_steps": 191, "total_steps": 231, "loss": 0.1354, "lr": 1.7867759685603115e-06, "epoch": 5.787878787878788, "percentage": 82.68, "elapsed_time": "3:40:00", "remaining_time": "0:46:04"}
192
+ {"current_steps": 192, "total_steps": 231, "loss": 0.1224, "lr": 1.7011470800097496e-06, "epoch": 5.818181818181818, "percentage": 83.12, "elapsed_time": "3:40:55", "remaining_time": "0:44:52"}
193
+ {"current_steps": 193, "total_steps": 231, "loss": 0.1268, "lr": 1.6174296671799571e-06, "epoch": 5.848484848484849, "percentage": 83.55, "elapsed_time": "3:41:29", "remaining_time": "0:43:36"}
194
+ {"current_steps": 194, "total_steps": 231, "loss": 0.1203, "lr": 1.5356430127119915e-06, "epoch": 5.878787878787879, "percentage": 83.98, "elapsed_time": "3:42:23", "remaining_time": "0:42:24"}
195
+ {"current_steps": 195, "total_steps": 231, "loss": 0.1219, "lr": 1.4558059545351144e-06, "epoch": 5.909090909090909, "percentage": 84.42, "elapsed_time": "3:43:09", "remaining_time": "0:41:11"}
196
+ {"current_steps": 196, "total_steps": 231, "loss": 0.1541, "lr": 1.3779368815278648e-06, "epoch": 5.9393939393939394, "percentage": 84.85, "elapsed_time": "3:44:09", "remaining_time": "0:40:01"}
197
+ {"current_steps": 197, "total_steps": 231, "loss": 0.1178, "lr": 1.302053729282533e-06, "epoch": 5.96969696969697, "percentage": 85.28, "elapsed_time": "3:44:52", "remaining_time": "0:38:48"}
198
+ {"current_steps": 198, "total_steps": 231, "loss": 0.1397, "lr": 1.2281739759740575e-06, "epoch": 6.0, "percentage": 85.71, "elapsed_time": "3:45:46", "remaining_time": "0:37:37"}
199
+ {"current_steps": 199, "total_steps": 231, "loss": 0.1333, "lr": 1.156314638334277e-06, "epoch": 6.03030303030303, "percentage": 86.15, "elapsed_time": "3:58:01", "remaining_time": "0:38:16"}
200
+ {"current_steps": 200, "total_steps": 231, "loss": 0.1451, "lr": 1.086492267732462e-06, "epoch": 6.0606060606060606, "percentage": 86.58, "elapsed_time": "3:58:56", "remaining_time": "0:37:02"}
201
+ {"current_steps": 201, "total_steps": 231, "loss": 0.1046, "lr": 1.01872294636304e-06, "epoch": 6.090909090909091, "percentage": 87.01, "elapsed_time": "3:59:45", "remaining_time": "0:35:47"}
202
+ {"current_steps": 202, "total_steps": 231, "loss": 0.1017, "lr": 9.530222835413739e-07, "epoch": 6.121212121212121, "percentage": 87.45, "elapsed_time": "4:00:25", "remaining_time": "0:34:30"}
203
+ {"current_steps": 203, "total_steps": 231, "loss": 0.1278, "lr": 8.894054121084839e-07, "epoch": 6.151515151515151, "percentage": 87.88, "elapsed_time": "4:01:16", "remaining_time": "0:33:16"}
204
+ {"current_steps": 204, "total_steps": 231, "loss": 0.1403, "lr": 8.278869849454718e-07, "epoch": 6.181818181818182, "percentage": 88.31, "elapsed_time": "4:02:14", "remaining_time": "0:32:03"}
205
+ {"current_steps": 205, "total_steps": 231, "loss": 0.1222, "lr": 7.684811715985429e-07, "epoch": 6.212121212121212, "percentage": 88.74, "elapsed_time": "4:03:14", "remaining_time": "0:30:50"}
206
+ {"current_steps": 206, "total_steps": 231, "loss": 0.1313, "lr": 7.1120165501533e-07, "epoch": 6.242424242424242, "percentage": 89.18, "elapsed_time": "4:04:04", "remaining_time": "0:29:37"}
207
+ {"current_steps": 207, "total_steps": 231, "loss": 0.1291, "lr": 6.560616283932897e-07, "epoch": 6.2727272727272725, "percentage": 89.61, "elapsed_time": "4:05:02", "remaining_time": "0:28:24"}
208
+ {"current_steps": 208, "total_steps": 231, "loss": 0.1534, "lr": 6.030737921409169e-07, "epoch": 6.303030303030303, "percentage": 90.04, "elapsed_time": "4:05:54", "remaining_time": "0:27:11"}
209
+ {"current_steps": 209, "total_steps": 231, "loss": 0.0873, "lr": 5.522503509524591e-07, "epoch": 6.333333333333333, "percentage": 90.48, "elapsed_time": "4:06:48", "remaining_time": "0:25:58"}
210
+ {"current_steps": 210, "total_steps": 231, "loss": 0.1134, "lr": 5.036030109968082e-07, "epoch": 6.363636363636363, "percentage": 90.91, "elapsed_time": "4:07:42", "remaining_time": "0:24:46"}