penfever commited on
Commit
0bb7961
·
verified ·
1 Parent(s): 76731bc

Training in progress, step 6200

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5fe2164a32210c2f757b9038450ac8a3ebcd09b0fa5be1d6b46aa064deb7e49a
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:68d6c6386a600613d3c47a73e7b96f600db162b111605056d7286307a5427ab5
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f9f6db7fd12a272ec3915e2de446692f15dcf34792fedc07b3b278607b609fb6
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ec9d4da97bf4ff8a801b1a3571052b5c5f6db2597c3f8a7755f6099f84d0b689
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0dadc1de14b16b0e4e9a8286930de8e13b6b8d53eea9553217dc4ead2858ee58
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:335032b14ba4d7f58fbd1707f6453910c9b2bc367fbee3666e6cdcc9976a5b92
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8892d3db17b47550012a8ec5b30a72b00875d049a4dcab465563bd9d9475c058
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c200192ab26a73f73681019168cd6493dd3087192021df8da32a697d36e6db21
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1221,3 +1221,43 @@
1221
  {"current_steps": 5990, "total_steps": 6713, "loss": 0.1305, "lr": 1.4009498892523388e-06, "epoch": 6.247261345852895, "percentage": 89.23, "elapsed_time": "22:49:36", "remaining_time": "2:45:18"}
1222
  {"current_steps": 5995, "total_steps": 6713, "loss": 0.1365, "lr": 1.3818917843080848e-06, "epoch": 6.2524778299426185, "percentage": 89.3, "elapsed_time": "22:52:39", "remaining_time": "2:44:23"}
1223
  {"current_steps": 6000, "total_steps": 6713, "loss": 0.1538, "lr": 1.3629595595533673e-06, "epoch": 6.257694314032342, "percentage": 89.38, "elapsed_time": "22:55:32", "remaining_time": "2:43:27"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1221
  {"current_steps": 5990, "total_steps": 6713, "loss": 0.1305, "lr": 1.4009498892523388e-06, "epoch": 6.247261345852895, "percentage": 89.23, "elapsed_time": "22:49:36", "remaining_time": "2:45:18"}
1222
  {"current_steps": 5995, "total_steps": 6713, "loss": 0.1365, "lr": 1.3818917843080848e-06, "epoch": 6.2524778299426185, "percentage": 89.3, "elapsed_time": "22:52:39", "remaining_time": "2:44:23"}
1223
  {"current_steps": 6000, "total_steps": 6713, "loss": 0.1538, "lr": 1.3629595595533673e-06, "epoch": 6.257694314032342, "percentage": 89.38, "elapsed_time": "22:55:32", "remaining_time": "2:43:27"}
1224
+ {"current_steps": 6005, "total_steps": 6713, "loss": 0.1739, "lr": 1.3441533429921804e-06, "epoch": 6.262910798122066, "percentage": 89.45, "elapsed_time": "22:59:30", "remaining_time": "2:42:38"}
1225
+ {"current_steps": 6010, "total_steps": 6713, "loss": 0.1538, "lr": 1.3254732617765375e-06, "epoch": 6.26812728221179, "percentage": 89.53, "elapsed_time": "23:02:29", "remaining_time": "2:41:42"}
1226
+ {"current_steps": 6015, "total_steps": 6713, "loss": 0.1429, "lr": 1.3069194422056454e-06, "epoch": 6.273343766301513, "percentage": 89.6, "elapsed_time": "23:05:32", "remaining_time": "2:40:46"}
1227
+ {"current_steps": 6020, "total_steps": 6713, "loss": 0.1445, "lr": 1.2884920097250197e-06, "epoch": 6.278560250391236, "percentage": 89.68, "elapsed_time": "23:08:34", "remaining_time": "2:39:50"}
1228
+ {"current_steps": 6025, "total_steps": 6713, "loss": 0.1572, "lr": 1.2701910889256651e-06, "epoch": 6.28377673448096, "percentage": 89.75, "elapsed_time": "23:11:36", "remaining_time": "2:38:54"}
1229
+ {"current_steps": 6030, "total_steps": 6713, "loss": 0.1598, "lr": 1.2520168035432102e-06, "epoch": 6.288993218570683, "percentage": 89.83, "elapsed_time": "23:14:44", "remaining_time": "2:37:58"}
1230
+ {"current_steps": 6035, "total_steps": 6713, "loss": 0.1523, "lr": 1.2339692764570853e-06, "epoch": 6.294209702660407, "percentage": 89.9, "elapsed_time": "23:17:49", "remaining_time": "2:37:02"}
1231
+ {"current_steps": 6040, "total_steps": 6713, "loss": 0.1496, "lr": 1.2160486296896834e-06, "epoch": 6.29942618675013, "percentage": 89.97, "elapsed_time": "23:20:48", "remaining_time": "2:36:05"}
1232
+ {"current_steps": 6045, "total_steps": 6713, "loss": 0.1405, "lr": 1.198254984405538e-06, "epoch": 6.304642670839854, "percentage": 90.05, "elapsed_time": "23:23:52", "remaining_time": "2:35:08"}
1233
+ {"current_steps": 6050, "total_steps": 6713, "loss": 0.1409, "lr": 1.1805884609105012e-06, "epoch": 6.309859154929577, "percentage": 90.12, "elapsed_time": "23:26:55", "remaining_time": "2:34:10"}
1234
+ {"current_steps": 6055, "total_steps": 6713, "loss": 0.1945, "lr": 1.1630491786509457e-06, "epoch": 6.315075639019301, "percentage": 90.2, "elapsed_time": "23:29:59", "remaining_time": "2:33:13"}
1235
+ {"current_steps": 6060, "total_steps": 6713, "loss": 0.1398, "lr": 1.1456372562129281e-06, "epoch": 6.3202921231090246, "percentage": 90.27, "elapsed_time": "23:33:04", "remaining_time": "2:32:16"}
1236
+ {"current_steps": 6065, "total_steps": 6713, "loss": 0.142, "lr": 1.1283528113214114e-06, "epoch": 6.325508607198748, "percentage": 90.35, "elapsed_time": "23:36:09", "remaining_time": "2:31:18"}
1237
+ {"current_steps": 6070, "total_steps": 6713, "loss": 0.1496, "lr": 1.1111959608394662e-06, "epoch": 6.330725091288471, "percentage": 90.42, "elapsed_time": "23:39:03", "remaining_time": "2:30:19"}
1238
+ {"current_steps": 6075, "total_steps": 6713, "loss": 0.148, "lr": 1.094166820767464e-06, "epoch": 6.335941575378195, "percentage": 90.5, "elapsed_time": "23:42:05", "remaining_time": "2:29:20"}
1239
+ {"current_steps": 6080, "total_steps": 6713, "loss": 0.1295, "lr": 1.0772655062423176e-06, "epoch": 6.341158059467919, "percentage": 90.57, "elapsed_time": "23:45:12", "remaining_time": "2:28:22"}
1240
+ {"current_steps": 6085, "total_steps": 6713, "loss": 0.1453, "lr": 1.0604921315366767e-06, "epoch": 6.346374543557642, "percentage": 90.65, "elapsed_time": "23:48:14", "remaining_time": "2:27:24"}
1241
+ {"current_steps": 6090, "total_steps": 6713, "loss": 0.1346, "lr": 1.0438468100581823e-06, "epoch": 6.351591027647365, "percentage": 90.72, "elapsed_time": "23:51:19", "remaining_time": "2:26:25"}
1242
+ {"current_steps": 6095, "total_steps": 6713, "loss": 0.1349, "lr": 1.027329654348672e-06, "epoch": 6.356807511737089, "percentage": 90.79, "elapsed_time": "23:54:16", "remaining_time": "2:25:25"}
1243
+ {"current_steps": 6100, "total_steps": 6713, "loss": 0.141, "lr": 1.01094077608344e-06, "epoch": 6.362023995826813, "percentage": 90.87, "elapsed_time": "23:57:17", "remaining_time": "2:24:26"}
1244
+ {"current_steps": 6105, "total_steps": 6713, "loss": 0.1447, "lr": 9.946802860704706e-07, "epoch": 6.3672404799165365, "percentage": 90.94, "elapsed_time": "1 day, 0:00:19", "remaining_time": "2:23:26"}
1245
+ {"current_steps": 6110, "total_steps": 6713, "loss": 0.1348, "lr": 9.785482942497037e-07, "epoch": 6.372456964006259, "percentage": 91.02, "elapsed_time": "1 day, 0:03:24", "remaining_time": "2:22:27"}
1246
+ {"current_steps": 6115, "total_steps": 6713, "loss": 0.1453, "lr": 9.625449096922667e-07, "epoch": 6.377673448095983, "percentage": 91.09, "elapsed_time": "1 day, 0:06:28", "remaining_time": "2:21:27"}
1247
+ {"current_steps": 6120, "total_steps": 6713, "loss": 0.1483, "lr": 9.466702405997674e-07, "epoch": 6.382889932185707, "percentage": 91.17, "elapsed_time": "1 day, 0:09:32", "remaining_time": "2:20:27"}
1248
+ {"current_steps": 6125, "total_steps": 6713, "loss": 0.1517, "lr": 9.309243943035295e-07, "epoch": 6.388106416275431, "percentage": 91.24, "elapsed_time": "1 day, 0:12:33", "remaining_time": "2:19:26"}
1249
+ {"current_steps": 6130, "total_steps": 6713, "loss": 0.2047, "lr": 9.153074772638937e-07, "epoch": 6.3933229003651535, "percentage": 91.32, "elapsed_time": "1 day, 0:15:00", "remaining_time": "2:18:22"}
1250
+ {"current_steps": 6135, "total_steps": 6713, "loss": 0.2038, "lr": 8.99819595069491e-07, "epoch": 6.398539384454877, "percentage": 91.39, "elapsed_time": "1 day, 0:17:08", "remaining_time": "2:17:16"}
1251
+ {"current_steps": 6140, "total_steps": 6713, "loss": 0.2008, "lr": 8.844608524365172e-07, "epoch": 6.403755868544601, "percentage": 91.46, "elapsed_time": "1 day, 0:19:41", "remaining_time": "2:16:13"}
1252
+ {"current_steps": 6145, "total_steps": 6713, "loss": 0.1994, "lr": 8.692313532080443e-07, "epoch": 6.408972352634325, "percentage": 91.54, "elapsed_time": "1 day, 0:22:02", "remaining_time": "2:15:08"}
1253
+ {"current_steps": 6150, "total_steps": 6713, "loss": 0.2109, "lr": 8.54131200353292e-07, "epoch": 6.414188836724048, "percentage": 91.61, "elapsed_time": "1 day, 0:24:24", "remaining_time": "2:14:03"}
1254
+ {"current_steps": 6155, "total_steps": 6713, "loss": 0.2106, "lr": 8.391604959669619e-07, "epoch": 6.419405320813771, "percentage": 91.69, "elapsed_time": "1 day, 0:26:40", "remaining_time": "2:12:57"}
1255
+ {"current_steps": 6160, "total_steps": 6713, "loss": 0.205, "lr": 8.243193412685246e-07, "epoch": 6.424621804903495, "percentage": 91.76, "elapsed_time": "1 day, 0:29:09", "remaining_time": "2:11:53"}
1256
+ {"current_steps": 6165, "total_steps": 6713, "loss": 0.1979, "lr": 8.096078366015514e-07, "epoch": 6.429838288993219, "percentage": 91.84, "elapsed_time": "1 day, 0:31:22", "remaining_time": "2:10:47"}
1257
+ {"current_steps": 6170, "total_steps": 6713, "loss": 0.2106, "lr": 7.950260814330169e-07, "epoch": 6.435054773082942, "percentage": 91.91, "elapsed_time": "1 day, 0:33:44", "remaining_time": "2:09:41"}
1258
+ {"current_steps": 6175, "total_steps": 6713, "loss": 0.2041, "lr": 7.805741743526441e-07, "epoch": 6.4402712571726655, "percentage": 91.99, "elapsed_time": "1 day, 0:35:58", "remaining_time": "2:08:35"}
1259
+ {"current_steps": 6180, "total_steps": 6713, "loss": 0.2055, "lr": 7.662522130722294e-07, "epoch": 6.445487741262389, "percentage": 92.06, "elapsed_time": "1 day, 0:38:12", "remaining_time": "2:07:29"}
1260
+ {"current_steps": 6185, "total_steps": 6713, "loss": 0.1994, "lr": 7.520602944249855e-07, "epoch": 6.450704225352113, "percentage": 92.13, "elapsed_time": "1 day, 0:40:44", "remaining_time": "2:06:24"}
1261
+ {"current_steps": 6190, "total_steps": 6713, "loss": 0.2054, "lr": 7.379985143648815e-07, "epoch": 6.455920709441836, "percentage": 92.21, "elapsed_time": "1 day, 0:42:51", "remaining_time": "2:05:17"}
1262
+ {"current_steps": 6195, "total_steps": 6713, "loss": 0.196, "lr": 7.240669679660017e-07, "epoch": 6.46113719353156, "percentage": 92.28, "elapsed_time": "1 day, 0:44:46", "remaining_time": "2:04:09"}
1263
+ {"current_steps": 6200, "total_steps": 6713, "loss": 0.1998, "lr": 7.102657494218879e-07, "epoch": 6.466353677621283, "percentage": 92.36, "elapsed_time": "1 day, 0:46:30", "remaining_time": "2:02:59"}