penfever commited on
Commit
d386e8a
·
verified ·
1 Parent(s): e39639a

Training in progress, step 7800

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d0e50885aaed73a8dfc4ac1b06e08fba79fa5503477defc3e6eeee34f6d045b7
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:31944b3141a126944cf97f77535e691f09d1c0e57638cea6a583ef12c7c2ba0e
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0e205cb24f15ca99742001709518e9a613878a0cc3829f6056bc58713cb37c61
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ec37270eb356ecab1545f31b544a15244602b4669893cda5c89590688893431
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:16e0bbb7eadc2c252853f9b37184b857d4577e550def9ec6b5bd8c3bfa42ff34
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf38094c335b7c24b410ce93eadd42a7ae97b94b1df74ed384a5b9260ce6aadc
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:538ab5256ac540e508280020dc51511c1044696e75ee5557226078b50c1862bf
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1777bf9c0dfc9c9833d945a93300f00a559e6ee8167baf963bbe562a26281a58
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -2242,3 +2242,33 @@
2242
  {"current_steps": 7655, "total_steps": 8169, "loss": 0.1288, "lr": 4.823361406800775e-07, "epoch": 6.55955441302485, "percentage": 93.71, "elapsed_time": "2:25:45", "remaining_time": "0:09:47"}
2243
  {"current_steps": 7660, "total_steps": 8169, "loss": 0.1205, "lr": 4.7305277346026523e-07, "epoch": 6.563838903170523, "percentage": 93.77, "elapsed_time": "2:28:36", "remaining_time": "0:09:52"}
2244
  {"current_steps": 7665, "total_steps": 8169, "loss": 0.1328, "lr": 4.6385854425258225e-07, "epoch": 6.5681233933161955, "percentage": 93.83, "elapsed_time": "2:31:24", "remaining_time": "0:09:57"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2242
  {"current_steps": 7655, "total_steps": 8169, "loss": 0.1288, "lr": 4.823361406800775e-07, "epoch": 6.55955441302485, "percentage": 93.71, "elapsed_time": "2:25:45", "remaining_time": "0:09:47"}
2243
  {"current_steps": 7660, "total_steps": 8169, "loss": 0.1205, "lr": 4.7305277346026523e-07, "epoch": 6.563838903170523, "percentage": 93.77, "elapsed_time": "2:28:36", "remaining_time": "0:09:52"}
2244
  {"current_steps": 7665, "total_steps": 8169, "loss": 0.1328, "lr": 4.6385854425258225e-07, "epoch": 6.5681233933161955, "percentage": 93.83, "elapsed_time": "2:31:24", "remaining_time": "0:09:57"}
2245
+ {"current_steps": 7670, "total_steps": 8169, "loss": 0.1214, "lr": 4.5475349502750675e-07, "epoch": 6.572407883461868, "percentage": 93.89, "elapsed_time": "2:34:13", "remaining_time": "0:10:02"}
2246
+ {"current_steps": 7675, "total_steps": 8169, "loss": 0.1274, "lr": 4.457376673484204e-07, "epoch": 6.576692373607541, "percentage": 93.95, "elapsed_time": "2:37:06", "remaining_time": "0:10:06"}
2247
+ {"current_steps": 7680, "total_steps": 8169, "loss": 0.1314, "lr": 4.3681110237142165e-07, "epoch": 6.580976863753214, "percentage": 94.01, "elapsed_time": "2:39:58", "remaining_time": "0:10:11"}
2248
+ {"current_steps": 7685, "total_steps": 8169, "loss": 0.1496, "lr": 4.279738408451395e-07, "epoch": 6.585261353898886, "percentage": 94.08, "elapsed_time": "2:42:37", "remaining_time": "0:10:14"}
2249
+ {"current_steps": 7690, "total_steps": 8169, "loss": 0.1273, "lr": 4.1922592311053776e-07, "epoch": 6.589545844044559, "percentage": 94.14, "elapsed_time": "2:45:27", "remaining_time": "0:10:18"}
2250
+ {"current_steps": 7695, "total_steps": 8169, "loss": 0.1216, "lr": 4.105673891007378e-07, "epoch": 6.593830334190232, "percentage": 94.2, "elapsed_time": "2:48:22", "remaining_time": "0:10:22"}
2251
+ {"current_steps": 7700, "total_steps": 8169, "loss": 0.1286, "lr": 4.0199827834084047e-07, "epoch": 6.598114824335904, "percentage": 94.26, "elapsed_time": "2:51:05", "remaining_time": "0:10:25"}
2252
+ {"current_steps": 7705, "total_steps": 8169, "loss": 0.1126, "lr": 3.9351862994774e-07, "epoch": 6.602399314481577, "percentage": 94.32, "elapsed_time": "2:53:56", "remaining_time": "0:10:28"}
2253
+ {"current_steps": 7710, "total_steps": 8169, "loss": 0.1278, "lr": 3.8512848262994175e-07, "epoch": 6.60668380462725, "percentage": 94.38, "elapsed_time": "2:56:50", "remaining_time": "0:10:31"}
2254
+ {"current_steps": 7715, "total_steps": 8169, "loss": 0.1345, "lr": 3.7682787468739544e-07, "epoch": 6.610968294772922, "percentage": 94.44, "elapsed_time": "2:59:38", "remaining_time": "0:10:34"}
2255
+ {"current_steps": 7720, "total_steps": 8169, "loss": 0.1301, "lr": 3.6861684401131135e-07, "epoch": 6.615252784918595, "percentage": 94.5, "elapsed_time": "3:02:22", "remaining_time": "0:10:36"}
2256
+ {"current_steps": 7725, "total_steps": 8169, "loss": 0.1228, "lr": 3.604954280839934e-07, "epoch": 6.619537275064268, "percentage": 94.56, "elapsed_time": "3:05:07", "remaining_time": "0:10:38"}
2257
+ {"current_steps": 7730, "total_steps": 8169, "loss": 0.1252, "lr": 3.524636639786616e-07, "epoch": 6.62382176520994, "percentage": 94.63, "elapsed_time": "3:07:53", "remaining_time": "0:10:40"}
2258
+ {"current_steps": 7735, "total_steps": 8169, "loss": 0.1346, "lr": 3.445215883592945e-07, "epoch": 6.628106255355613, "percentage": 94.69, "elapsed_time": "3:10:34", "remaining_time": "0:10:41"}
2259
+ {"current_steps": 7740, "total_steps": 8169, "loss": 0.1382, "lr": 3.36669237480447e-07, "epoch": 6.632390745501286, "percentage": 94.75, "elapsed_time": "3:13:28", "remaining_time": "0:10:43"}
2260
+ {"current_steps": 7745, "total_steps": 8169, "loss": 0.1432, "lr": 3.289066471870972e-07, "epoch": 6.636675235646958, "percentage": 94.81, "elapsed_time": "3:16:17", "remaining_time": "0:10:44"}
2261
+ {"current_steps": 7750, "total_steps": 8169, "loss": 0.1396, "lr": 3.2123385291447315e-07, "epoch": 6.640959725792631, "percentage": 94.87, "elapsed_time": "3:19:07", "remaining_time": "0:10:45"}
2262
+ {"current_steps": 7755, "total_steps": 8169, "loss": 0.1249, "lr": 3.136508896878976e-07, "epoch": 6.645244215938304, "percentage": 94.93, "elapsed_time": "3:21:55", "remaining_time": "0:10:46"}
2263
+ {"current_steps": 7760, "total_steps": 8169, "loss": 0.1377, "lr": 3.0615779212262773e-07, "epoch": 6.649528706083976, "percentage": 94.99, "elapsed_time": "3:24:42", "remaining_time": "0:10:47"}
2264
+ {"current_steps": 7765, "total_steps": 8169, "loss": 0.1272, "lr": 2.9875459442368915e-07, "epoch": 6.653813196229649, "percentage": 95.05, "elapsed_time": "3:27:33", "remaining_time": "0:10:47"}
2265
+ {"current_steps": 7770, "total_steps": 8169, "loss": 0.1389, "lr": 2.914413303857377e-07, "epoch": 6.658097686375322, "percentage": 95.12, "elapsed_time": "3:30:26", "remaining_time": "0:10:48"}
2266
+ {"current_steps": 7775, "total_steps": 8169, "loss": 0.1392, "lr": 2.8421803339288236e-07, "epoch": 6.662382176520994, "percentage": 95.18, "elapsed_time": "3:33:13", "remaining_time": "0:10:48"}
2267
+ {"current_steps": 7780, "total_steps": 8169, "loss": 0.1169, "lr": 2.7708473641854917e-07, "epoch": 6.666666666666667, "percentage": 95.24, "elapsed_time": "3:36:14", "remaining_time": "0:10:48"}
2268
+ {"current_steps": 7785, "total_steps": 8169, "loss": 0.1355, "lr": 2.7004147202532416e-07, "epoch": 6.67095115681234, "percentage": 95.3, "elapsed_time": "3:39:00", "remaining_time": "0:10:48"}
2269
+ {"current_steps": 7790, "total_steps": 8169, "loss": 0.126, "lr": 2.630882723648087e-07, "epoch": 6.675235646958012, "percentage": 95.36, "elapsed_time": "3:41:53", "remaining_time": "0:10:47"}
2270
+ {"current_steps": 7795, "total_steps": 8169, "loss": 0.1424, "lr": 2.5622516917746644e-07, "epoch": 6.679520137103685, "percentage": 95.42, "elapsed_time": "3:44:40", "remaining_time": "0:10:46"}
2271
+ {"current_steps": 7800, "total_steps": 8169, "loss": 0.1361, "lr": 2.494521937924854e-07, "epoch": 6.683804627249358, "percentage": 95.48, "elapsed_time": "3:47:42", "remaining_time": "0:10:46"}
2272
+ {"current_steps": 7805, "total_steps": 8169, "loss": 0.1218, "lr": 2.427693771276274e-07, "epoch": 6.68808911739503, "percentage": 95.54, "elapsed_time": "3:51:45", "remaining_time": "0:10:48"}
2273
+ {"current_steps": 7810, "total_steps": 8169, "loss": 0.1339, "lr": 2.3617674968909876e-07, "epoch": 6.692373607540703, "percentage": 95.61, "elapsed_time": "3:54:31", "remaining_time": "0:10:46"}
2274
+ {"current_steps": 7815, "total_steps": 8169, "loss": 0.1118, "lr": 2.2967434157139756e-07, "epoch": 6.696658097686376, "percentage": 95.67, "elapsed_time": "3:57:19", "remaining_time": "0:10:45"}