penfever commited on
Commit
41ed66e
·
verified ·
1 Parent(s): 32155db

Training in progress, step 12698

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a8a431f35c93cc45c5f0626f1ed8782b0cf3fad52044b60e5f67d52ae99bc342
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e0d79a9b23d10997c320b6d51ed2c9cf87c6f94b9fce7edbc7e506283e66d30
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bce38ef8ebbd02fe3e6301409b57f5c5319ad601a7c471afe4a12da35690f851
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fadaf539e8977a879e1242f027000e208a6c5568a99e4de59d2ad8be986fede6
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:62ca25b44abd5febd786205accf5229dfb958a5675223cc32c61e0987ef56e5d
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d80aa45a937a8923edf31a041143aaf27ddc9160c6754fed0106b0e1ab3dbba8
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:45d5b56bb5879c220019e6ec1f2ad00759a02d2ca8a1b33d32f54b3a0e9b741c
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d65e8c8ef7f2239cfc763366d0f98071d36428404f3897efd2c2013eb1fb27f
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -2429,3 +2429,112 @@
2429
  {"current_steps": 12145, "total_steps": 12698, "loss": 0.1629, "lr": 2.3149372546821258e-07, "epoch": 6.695148842337376, "percentage": 95.64, "elapsed_time": "21:41:50", "remaining_time": "0:59:16"}
2430
  {"current_steps": 12150, "total_steps": 12698, "loss": 0.166, "lr": 2.273418936204297e-07, "epoch": 6.697905181918412, "percentage": 95.68, "elapsed_time": "21:42:20", "remaining_time": "0:58:44"}
2431
  {"current_steps": 12155, "total_steps": 12698, "loss": 0.1622, "lr": 2.2322741810918202e-07, "epoch": 6.700661521499448, "percentage": 95.72, "elapsed_time": "21:42:45", "remaining_time": "0:58:11"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2429
  {"current_steps": 12145, "total_steps": 12698, "loss": 0.1629, "lr": 2.3149372546821258e-07, "epoch": 6.695148842337376, "percentage": 95.64, "elapsed_time": "21:41:50", "remaining_time": "0:59:16"}
2430
  {"current_steps": 12150, "total_steps": 12698, "loss": 0.166, "lr": 2.273418936204297e-07, "epoch": 6.697905181918412, "percentage": 95.68, "elapsed_time": "21:42:20", "remaining_time": "0:58:44"}
2431
  {"current_steps": 12155, "total_steps": 12698, "loss": 0.1622, "lr": 2.2322741810918202e-07, "epoch": 6.700661521499448, "percentage": 95.72, "elapsed_time": "21:42:45", "remaining_time": "0:58:11"}
2432
+ {"current_steps": 12160, "total_steps": 12698, "loss": 0.1701, "lr": 2.1915030670791594e-07, "epoch": 6.703417861080485, "percentage": 95.76, "elapsed_time": "21:43:10", "remaining_time": "0:57:39"}
2433
+ {"current_steps": 12165, "total_steps": 12698, "loss": 0.1775, "lr": 2.1511056711948751e-07, "epoch": 6.706174200661522, "percentage": 95.8, "elapsed_time": "21:43:36", "remaining_time": "0:57:07"}
2434
+ {"current_steps": 12170, "total_steps": 12698, "loss": 0.1748, "lr": 2.1110820697614943e-07, "epoch": 6.708930540242558, "percentage": 95.84, "elapsed_time": "21:44:03", "remaining_time": "0:56:34"}
2435
+ {"current_steps": 12175, "total_steps": 12698, "loss": 0.1671, "lr": 2.071432338395285e-07, "epoch": 6.711686879823594, "percentage": 95.88, "elapsed_time": "21:44:30", "remaining_time": "0:56:02"}
2436
+ {"current_steps": 12180, "total_steps": 12698, "loss": 0.1694, "lr": 2.0321565520061925e-07, "epoch": 6.714443219404631, "percentage": 95.92, "elapsed_time": "21:44:55", "remaining_time": "0:55:29"}
2437
+ {"current_steps": 12185, "total_steps": 12698, "loss": 0.1671, "lr": 1.9932547847976823e-07, "epoch": 6.7171995589856675, "percentage": 95.96, "elapsed_time": "21:45:23", "remaining_time": "0:54:57"}
2438
+ {"current_steps": 12190, "total_steps": 12698, "loss": 0.1368, "lr": 1.9547271102665854e-07, "epoch": 6.719955898566703, "percentage": 96.0, "elapsed_time": "21:45:57", "remaining_time": "0:54:25"}
2439
+ {"current_steps": 12195, "total_steps": 12698, "loss": 0.0831, "lr": 1.91657360120292e-07, "epoch": 6.722712238147739, "percentage": 96.04, "elapsed_time": "21:46:21", "remaining_time": "0:53:52"}
2440
+ {"current_steps": 12200, "total_steps": 12698, "loss": 0.074, "lr": 1.878794329689848e-07, "epoch": 6.725468577728776, "percentage": 96.08, "elapsed_time": "21:46:49", "remaining_time": "0:53:20"}
2441
+ {"current_steps": 12205, "total_steps": 12698, "loss": 0.0793, "lr": 1.8413893671034744e-07, "epoch": 6.728224917309813, "percentage": 96.12, "elapsed_time": "21:47:12", "remaining_time": "0:52:48"}
2442
+ {"current_steps": 12210, "total_steps": 12698, "loss": 0.07, "lr": 1.804358784112692e-07, "epoch": 6.730981256890849, "percentage": 96.16, "elapsed_time": "21:47:35", "remaining_time": "0:52:15"}
2443
+ {"current_steps": 12215, "total_steps": 12698, "loss": 0.0774, "lr": 1.7677026506791372e-07, "epoch": 6.733737596471885, "percentage": 96.2, "elapsed_time": "21:48:05", "remaining_time": "0:51:43"}
2444
+ {"current_steps": 12220, "total_steps": 12698, "loss": 0.1174, "lr": 1.731421036056946e-07, "epoch": 6.736493936052922, "percentage": 96.24, "elapsed_time": "21:48:30", "remaining_time": "0:51:11"}
2445
+ {"current_steps": 12225, "total_steps": 12698, "loss": 0.0881, "lr": 1.6955140087927314e-07, "epoch": 6.7392502756339585, "percentage": 96.28, "elapsed_time": "21:48:57", "remaining_time": "0:50:38"}
2446
+ {"current_steps": 12230, "total_steps": 12698, "loss": 0.0832, "lr": 1.6599816367253385e-07, "epoch": 6.7420066152149944, "percentage": 96.31, "elapsed_time": "21:49:22", "remaining_time": "0:50:06"}
2447
+ {"current_steps": 12235, "total_steps": 12698, "loss": 0.1087, "lr": 1.6248239869858463e-07, "epoch": 6.74476295479603, "percentage": 96.35, "elapsed_time": "21:50:19", "remaining_time": "0:49:35"}
2448
+ {"current_steps": 12240, "total_steps": 12698, "loss": 0.0634, "lr": 1.5900411259973214e-07, "epoch": 6.747519294377067, "percentage": 96.39, "elapsed_time": "21:50:51", "remaining_time": "0:49:03"}
2449
+ {"current_steps": 12245, "total_steps": 12698, "loss": 0.0732, "lr": 1.5556331194747755e-07, "epoch": 6.750275633958104, "percentage": 96.43, "elapsed_time": "21:51:28", "remaining_time": "0:48:31"}
2450
+ {"current_steps": 12250, "total_steps": 12698, "loss": 0.0728, "lr": 1.5216000324250079e-07, "epoch": 6.75303197353914, "percentage": 96.47, "elapsed_time": "21:52:03", "remaining_time": "0:47:59"}
2451
+ {"current_steps": 12255, "total_steps": 12698, "loss": 0.1143, "lr": 1.4879419291464747e-07, "epoch": 6.755788313120176, "percentage": 96.51, "elapsed_time": "21:52:36", "remaining_time": "0:47:26"}
2452
+ {"current_steps": 12260, "total_steps": 12698, "loss": 0.067, "lr": 1.4546588732291532e-07, "epoch": 6.758544652701213, "percentage": 96.55, "elapsed_time": "21:52:59", "remaining_time": "0:46:54"}
2453
+ {"current_steps": 12265, "total_steps": 12698, "loss": 0.0751, "lr": 1.4217509275545217e-07, "epoch": 6.76130099228225, "percentage": 96.59, "elapsed_time": "21:53:28", "remaining_time": "0:46:22"}
2454
+ {"current_steps": 12270, "total_steps": 12698, "loss": 0.0626, "lr": 1.3892181542952688e-07, "epoch": 6.7640573318632855, "percentage": 96.63, "elapsed_time": "21:53:51", "remaining_time": "0:45:49"}
2455
+ {"current_steps": 12275, "total_steps": 12698, "loss": 0.0766, "lr": 1.357060614915362e-07, "epoch": 6.766813671444321, "percentage": 96.67, "elapsed_time": "21:54:14", "remaining_time": "0:45:17"}
2456
+ {"current_steps": 12280, "total_steps": 12698, "loss": 0.0783, "lr": 1.3252783701698026e-07, "epoch": 6.769570011025358, "percentage": 96.71, "elapsed_time": "21:54:40", "remaining_time": "0:44:45"}
2457
+ {"current_steps": 12285, "total_steps": 12698, "loss": 0.084, "lr": 1.2938714801044916e-07, "epoch": 6.772326350606395, "percentage": 96.75, "elapsed_time": "21:55:13", "remaining_time": "0:44:12"}
2458
+ {"current_steps": 12290, "total_steps": 12698, "loss": 0.0814, "lr": 1.2628400040562983e-07, "epoch": 6.775082690187431, "percentage": 96.79, "elapsed_time": "21:55:35", "remaining_time": "0:43:40"}
2459
+ {"current_steps": 12295, "total_steps": 12698, "loss": 0.1097, "lr": 1.2321840006527475e-07, "epoch": 6.777839029768468, "percentage": 96.83, "elapsed_time": "21:56:14", "remaining_time": "0:43:08"}
2460
+ {"current_steps": 12300, "total_steps": 12698, "loss": 0.0699, "lr": 1.2019035278119983e-07, "epoch": 6.780595369349504, "percentage": 96.87, "elapsed_time": "21:56:36", "remaining_time": "0:42:36"}
2461
+ {"current_steps": 12305, "total_steps": 12698, "loss": 0.0774, "lr": 1.1719986427427111e-07, "epoch": 6.783351708930541, "percentage": 96.91, "elapsed_time": "21:56:56", "remaining_time": "0:42:03"}
2462
+ {"current_steps": 12310, "total_steps": 12698, "loss": 0.1031, "lr": 1.1424694019439575e-07, "epoch": 6.786108048511577, "percentage": 96.94, "elapsed_time": "21:57:22", "remaining_time": "0:41:31"}
2463
+ {"current_steps": 12315, "total_steps": 12698, "loss": 0.0894, "lr": 1.1133158612051331e-07, "epoch": 6.788864388092613, "percentage": 96.98, "elapsed_time": "21:57:59", "remaining_time": "0:40:59"}
2464
+ {"current_steps": 12320, "total_steps": 12698, "loss": 0.099, "lr": 1.084538075605801e-07, "epoch": 6.791620727673649, "percentage": 97.02, "elapsed_time": "21:58:31", "remaining_time": "0:40:27"}
2465
+ {"current_steps": 12325, "total_steps": 12698, "loss": 0.2354, "lr": 1.0561360995156034e-07, "epoch": 6.794377067254686, "percentage": 97.06, "elapsed_time": "21:59:18", "remaining_time": "0:39:55"}
2466
+ {"current_steps": 12330, "total_steps": 12698, "loss": 0.0844, "lr": 1.0281099865941946e-07, "epoch": 6.797133406835722, "percentage": 97.1, "elapsed_time": "21:59:50", "remaining_time": "0:39:23"}
2467
+ {"current_steps": 12335, "total_steps": 12698, "loss": 0.0831, "lr": 1.0004597897911084e-07, "epoch": 6.799889746416759, "percentage": 97.14, "elapsed_time": "22:00:16", "remaining_time": "0:38:51"}
2468
+ {"current_steps": 12340, "total_steps": 12698, "loss": 0.1682, "lr": 9.731855613456687e-08, "epoch": 6.802646085997795, "percentage": 97.18, "elapsed_time": "22:01:09", "remaining_time": "0:38:19"}
2469
+ {"current_steps": 12345, "total_steps": 12698, "loss": 0.0633, "lr": 9.462873527868343e-08, "epoch": 6.805402425578832, "percentage": 97.22, "elapsed_time": "22:01:37", "remaining_time": "0:37:47"}
2470
+ {"current_steps": 12350, "total_steps": 12698, "loss": 0.0847, "lr": 9.197652149332215e-08, "epoch": 6.808158765159868, "percentage": 97.26, "elapsed_time": "22:02:11", "remaining_time": "0:37:15"}
2471
+ {"current_steps": 12355, "total_steps": 12698, "loss": 0.0818, "lr": 8.936191978929254e-08, "epoch": 6.8109151047409044, "percentage": 97.3, "elapsed_time": "22:02:37", "remaining_time": "0:36:43"}
2472
+ {"current_steps": 12360, "total_steps": 12698, "loss": 0.0692, "lr": 8.678493510633656e-08, "epoch": 6.81367144432194, "percentage": 97.34, "elapsed_time": "22:03:09", "remaining_time": "0:36:11"}
2473
+ {"current_steps": 12365, "total_steps": 12698, "loss": 0.0679, "lr": 8.424557231313746e-08, "epoch": 6.816427783902977, "percentage": 97.38, "elapsed_time": "22:03:33", "remaining_time": "0:35:38"}
2474
+ {"current_steps": 12370, "total_steps": 12698, "loss": 0.0699, "lr": 8.174383620729087e-08, "epoch": 6.819184123484013, "percentage": 97.42, "elapsed_time": "22:03:53", "remaining_time": "0:35:06"}
2475
+ {"current_steps": 12375, "total_steps": 12698, "loss": 0.0668, "lr": 7.927973151531155e-08, "epoch": 6.82194046306505, "percentage": 97.46, "elapsed_time": "22:04:15", "remaining_time": "0:34:33"}
2476
+ {"current_steps": 12380, "total_steps": 12698, "loss": 0.1063, "lr": 7.685326289261108e-08, "epoch": 6.824696802646086, "percentage": 97.5, "elapsed_time": "22:04:49", "remaining_time": "0:34:01"}
2477
+ {"current_steps": 12385, "total_steps": 12698, "loss": 0.0643, "lr": 7.446443492350242e-08, "epoch": 6.827453142227123, "percentage": 97.54, "elapsed_time": "22:05:20", "remaining_time": "0:33:29"}
2478
+ {"current_steps": 12390, "total_steps": 12698, "loss": 0.0634, "lr": 7.211325212117759e-08, "epoch": 6.830209481808159, "percentage": 97.57, "elapsed_time": "22:05:43", "remaining_time": "0:32:57"}
2479
+ {"current_steps": 12395, "total_steps": 12698, "loss": 0.0637, "lr": 6.979971892770998e-08, "epoch": 6.8329658213891955, "percentage": 97.61, "elapsed_time": "22:06:05", "remaining_time": "0:32:25"}
2480
+ {"current_steps": 12400, "total_steps": 12698, "loss": 0.0648, "lr": 6.752383971404097e-08, "epoch": 6.835722160970231, "percentage": 97.65, "elapsed_time": "22:06:34", "remaining_time": "0:31:52"}
2481
+ {"current_steps": 12405, "total_steps": 12698, "loss": 0.1049, "lr": 6.528561877997108e-08, "epoch": 6.838478500551268, "percentage": 97.69, "elapsed_time": "22:07:20", "remaining_time": "0:31:21"}
2482
+ {"current_steps": 12410, "total_steps": 12698, "loss": 0.0923, "lr": 6.308506035415552e-08, "epoch": 6.841234840132304, "percentage": 97.73, "elapsed_time": "22:07:53", "remaining_time": "0:30:48"}
2483
+ {"current_steps": 12415, "total_steps": 12698, "loss": 0.0776, "lr": 6.092216859409306e-08, "epoch": 6.843991179713341, "percentage": 97.77, "elapsed_time": "22:08:17", "remaining_time": "0:30:16"}
2484
+ {"current_steps": 12420, "total_steps": 12698, "loss": 0.0911, "lr": 5.879694758611942e-08, "epoch": 6.846747519294377, "percentage": 97.81, "elapsed_time": "22:08:40", "remaining_time": "0:29:44"}
2485
+ {"current_steps": 12425, "total_steps": 12698, "loss": 0.1138, "lr": 5.6709401345396154e-08, "epoch": 6.849503858875414, "percentage": 97.85, "elapsed_time": "22:09:17", "remaining_time": "0:29:12"}
2486
+ {"current_steps": 12430, "total_steps": 12698, "loss": 0.0794, "lr": 5.4659533815912826e-08, "epoch": 6.85226019845645, "percentage": 97.89, "elapsed_time": "22:09:43", "remaining_time": "0:28:40"}
2487
+ {"current_steps": 12435, "total_steps": 12698, "loss": 0.0929, "lr": 5.264734887046707e-08, "epoch": 6.855016538037487, "percentage": 97.93, "elapsed_time": "22:10:08", "remaining_time": "0:28:07"}
2488
+ {"current_steps": 12440, "total_steps": 12698, "loss": 0.0744, "lr": 5.06728503106646e-08, "epoch": 6.8577728776185225, "percentage": 97.97, "elapsed_time": "22:10:29", "remaining_time": "0:27:35"}
2489
+ {"current_steps": 12445, "total_steps": 12698, "loss": 0.0725, "lr": 4.8736041866912496e-08, "epoch": 6.860529217199559, "percentage": 98.01, "elapsed_time": "22:11:00", "remaining_time": "0:27:03"}
2490
+ {"current_steps": 12450, "total_steps": 12698, "loss": 0.0782, "lr": 4.683692719840594e-08, "epoch": 6.863285556780595, "percentage": 98.05, "elapsed_time": "22:11:43", "remaining_time": "0:26:31"}
2491
+ {"current_steps": 12455, "total_steps": 12698, "loss": 0.068, "lr": 4.497550989313038e-08, "epoch": 6.866041896361632, "percentage": 98.09, "elapsed_time": "22:12:22", "remaining_time": "0:25:59"}
2492
+ {"current_steps": 12460, "total_steps": 12698, "loss": 0.0663, "lr": 4.315179346784826e-08, "epoch": 6.868798235942668, "percentage": 98.13, "elapsed_time": "22:12:47", "remaining_time": "0:25:27"}
2493
+ {"current_steps": 12465, "total_steps": 12698, "loss": 0.0756, "lr": 4.136578136809233e-08, "epoch": 6.871554575523705, "percentage": 98.17, "elapsed_time": "22:13:23", "remaining_time": "0:24:55"}
2494
+ {"current_steps": 12470, "total_steps": 12698, "loss": 0.0802, "lr": 3.96174769681612e-08, "epoch": 6.874310915104741, "percentage": 98.2, "elapsed_time": "22:14:05", "remaining_time": "0:24:23"}
2495
+ {"current_steps": 12475, "total_steps": 12698, "loss": 0.0848, "lr": 3.790688357111494e-08, "epoch": 6.877067254685778, "percentage": 98.24, "elapsed_time": "22:14:29", "remaining_time": "0:23:51"}
2496
+ {"current_steps": 12480, "total_steps": 12698, "loss": 0.0725, "lr": 3.62340044087639e-08, "epoch": 6.879823594266814, "percentage": 98.28, "elapsed_time": "22:14:50", "remaining_time": "0:23:19"}
2497
+ {"current_steps": 12485, "total_steps": 12698, "loss": 0.0712, "lr": 3.45988426416688e-08, "epoch": 6.88257993384785, "percentage": 98.32, "elapsed_time": "22:15:17", "remaining_time": "0:22:46"}
2498
+ {"current_steps": 12490, "total_steps": 12698, "loss": 0.0799, "lr": 3.3001401359125106e-08, "epoch": 6.885336273428886, "percentage": 98.36, "elapsed_time": "22:15:51", "remaining_time": "0:22:14"}
2499
+ {"current_steps": 12495, "total_steps": 12698, "loss": 0.0586, "lr": 3.1441683579167545e-08, "epoch": 6.888092613009923, "percentage": 98.4, "elapsed_time": "22:16:13", "remaining_time": "0:21:42"}
2500
+ {"current_steps": 12500, "total_steps": 12698, "loss": 0.0796, "lr": 2.991969224856117e-08, "epoch": 6.890848952590959, "percentage": 98.44, "elapsed_time": "22:16:38", "remaining_time": "0:21:10"}
2501
+ {"current_steps": 12505, "total_steps": 12698, "loss": 0.0739, "lr": 2.8435430242792496e-08, "epoch": 6.893605292171996, "percentage": 98.48, "elapsed_time": "22:17:04", "remaining_time": "0:20:38"}
2502
+ {"current_steps": 12510, "total_steps": 12698, "loss": 0.0832, "lr": 2.6988900366067274e-08, "epoch": 6.896361631753032, "percentage": 98.52, "elapsed_time": "22:17:35", "remaining_time": "0:20:06"}
2503
+ {"current_steps": 12515, "total_steps": 12698, "loss": 0.0762, "lr": 2.558010535130162e-08, "epoch": 6.899117971334069, "percentage": 98.56, "elapsed_time": "22:18:09", "remaining_time": "0:19:34"}
2504
+ {"current_steps": 12520, "total_steps": 12698, "loss": 0.0834, "lr": 2.4209047860122015e-08, "epoch": 6.901874310915105, "percentage": 98.6, "elapsed_time": "22:18:30", "remaining_time": "0:19:01"}
2505
+ {"current_steps": 12525, "total_steps": 12698, "loss": 0.0779, "lr": 2.2875730482856405e-08, "epoch": 6.904630650496141, "percentage": 98.64, "elapsed_time": "22:19:01", "remaining_time": "0:18:29"}
2506
+ {"current_steps": 12530, "total_steps": 12698, "loss": 0.0834, "lr": 2.1580155738534226e-08, "epoch": 6.907386990077177, "percentage": 98.68, "elapsed_time": "22:19:30", "remaining_time": "0:17:57"}
2507
+ {"current_steps": 12535, "total_steps": 12698, "loss": 0.076, "lr": 2.0322326074875277e-08, "epoch": 6.910143329658214, "percentage": 98.72, "elapsed_time": "22:19:55", "remaining_time": "0:17:25"}
2508
+ {"current_steps": 12540, "total_steps": 12698, "loss": 0.0686, "lr": 1.9102243868285298e-08, "epoch": 6.91289966923925, "percentage": 98.76, "elapsed_time": "22:20:16", "remaining_time": "0:16:53"}
2509
+ {"current_steps": 12545, "total_steps": 12698, "loss": 0.0849, "lr": 1.791991142385596e-08, "epoch": 6.915656008820287, "percentage": 98.8, "elapsed_time": "22:20:56", "remaining_time": "0:16:21"}
2510
+ {"current_steps": 12550, "total_steps": 12698, "loss": 0.0731, "lr": 1.677533097536266e-08, "epoch": 6.918412348401323, "percentage": 98.83, "elapsed_time": "22:21:23", "remaining_time": "0:15:49"}
2511
+ {"current_steps": 12555, "total_steps": 12698, "loss": 0.0653, "lr": 1.5668504685251163e-08, "epoch": 6.92116868798236, "percentage": 98.87, "elapsed_time": "22:21:51", "remaining_time": "0:15:17"}
2512
+ {"current_steps": 12560, "total_steps": 12698, "loss": 0.0732, "lr": 1.4599434644639866e-08, "epoch": 6.923925027563396, "percentage": 98.91, "elapsed_time": "22:22:29", "remaining_time": "0:14:45"}
2513
+ {"current_steps": 12565, "total_steps": 12698, "loss": 0.0641, "lr": 1.3568122873313106e-08, "epoch": 6.9266813671444325, "percentage": 98.95, "elapsed_time": "22:22:55", "remaining_time": "0:14:12"}
2514
+ {"current_steps": 12570, "total_steps": 12698, "loss": 0.0628, "lr": 1.2574571319723395e-08, "epoch": 6.929437706725468, "percentage": 98.99, "elapsed_time": "22:23:19", "remaining_time": "0:13:40"}
2515
+ {"current_steps": 12575, "total_steps": 12698, "loss": 0.081, "lr": 1.161878186098031e-08, "epoch": 6.932194046306505, "percentage": 99.03, "elapsed_time": "22:23:47", "remaining_time": "0:13:08"}
2516
+ {"current_steps": 12580, "total_steps": 12698, "loss": 0.0896, "lr": 1.070075630284828e-08, "epoch": 6.934950385887541, "percentage": 99.07, "elapsed_time": "22:24:22", "remaining_time": "0:12:36"}
2517
+ {"current_steps": 12585, "total_steps": 12698, "loss": 0.0727, "lr": 9.820496379748801e-09, "epoch": 6.937706725468578, "percentage": 99.11, "elapsed_time": "22:24:46", "remaining_time": "0:12:04"}
2518
+ {"current_steps": 12590, "total_steps": 12698, "loss": 0.0757, "lr": 8.978003754744891e-09, "epoch": 6.940463065049614, "percentage": 99.15, "elapsed_time": "22:25:13", "remaining_time": "0:11:32"}
2519
+ {"current_steps": 12595, "total_steps": 12698, "loss": 0.0926, "lr": 8.17328001955886e-09, "epoch": 6.943219404630651, "percentage": 99.19, "elapsed_time": "22:25:35", "remaining_time": "0:11:00"}
2520
+ {"current_steps": 12600, "total_steps": 12698, "loss": 0.07, "lr": 7.406326694543442e-09, "epoch": 6.945975744211687, "percentage": 99.23, "elapsed_time": "22:25:56", "remaining_time": "0:10:28"}
2521
+ {"current_steps": 12605, "total_steps": 12698, "loss": 0.0743, "lr": 6.677145228699555e-09, "epoch": 6.948732083792724, "percentage": 99.27, "elapsed_time": "22:26:19", "remaining_time": "0:09:55"}
2522
+ {"current_steps": 12610, "total_steps": 12698, "loss": 0.0709, "lr": 5.985736999665204e-09, "epoch": 6.9514884233737595, "percentage": 99.31, "elapsed_time": "22:26:44", "remaining_time": "0:09:23"}
2523
+ {"current_steps": 12615, "total_steps": 12698, "loss": 0.105, "lr": 5.332103313713255e-09, "epoch": 6.954244762954796, "percentage": 99.35, "elapsed_time": "22:27:21", "remaining_time": "0:08:51"}
2524
+ {"current_steps": 12620, "total_steps": 12698, "loss": 0.0827, "lr": 4.716245405747e-09, "epoch": 6.957001102535832, "percentage": 99.39, "elapsed_time": "22:28:00", "remaining_time": "0:08:19"}
2525
+ {"current_steps": 12625, "total_steps": 12698, "loss": 0.0702, "lr": 4.138164439304593e-09, "epoch": 6.959757442116869, "percentage": 99.43, "elapsed_time": "22:28:25", "remaining_time": "0:07:47"}
2526
+ {"current_steps": 12630, "total_steps": 12698, "loss": 0.0699, "lr": 3.5978615065479504e-09, "epoch": 6.962513781697905, "percentage": 99.46, "elapsed_time": "22:28:47", "remaining_time": "0:07:15"}
2527
+ {"current_steps": 12635, "total_steps": 12698, "loss": 0.0686, "lr": 3.0953376282694126e-09, "epoch": 6.965270121278942, "percentage": 99.5, "elapsed_time": "22:29:09", "remaining_time": "0:06:43"}
2528
+ {"current_steps": 12640, "total_steps": 12698, "loss": 0.0622, "lr": 2.6305937538828595e-09, "epoch": 6.968026460859978, "percentage": 99.54, "elapsed_time": "22:29:29", "remaining_time": "0:06:11"}
2529
+ {"current_steps": 12645, "total_steps": 12698, "loss": 0.0861, "lr": 2.203630761423714e-09, "epoch": 6.970782800441015, "percentage": 99.58, "elapsed_time": "22:29:50", "remaining_time": "0:05:39"}
2530
+ {"current_steps": 12650, "total_steps": 12698, "loss": 0.0626, "lr": 1.81444945755338e-09, "epoch": 6.9735391400220506, "percentage": 99.62, "elapsed_time": "22:30:14", "remaining_time": "0:05:07"}
2531
+ {"current_steps": 12655, "total_steps": 12698, "loss": 0.068, "lr": 1.4630505775459213e-09, "epoch": 6.976295479603087, "percentage": 99.66, "elapsed_time": "22:30:36", "remaining_time": "0:04:35"}
2532
+ {"current_steps": 12660, "total_steps": 12698, "loss": 0.069, "lr": 1.1494347852991639e-09, "epoch": 6.979051819184123, "percentage": 99.7, "elapsed_time": "22:31:00", "remaining_time": "0:04:03"}
2533
+ {"current_steps": 12665, "total_steps": 12698, "loss": 0.0716, "lr": 8.736026733213721e-10, "epoch": 6.98180815876516, "percentage": 99.74, "elapsed_time": "22:31:35", "remaining_time": "0:03:31"}
2534
+ {"current_steps": 12670, "total_steps": 12698, "loss": 0.0615, "lr": 6.355547627445724e-10, "epoch": 6.984564498346196, "percentage": 99.78, "elapsed_time": "22:32:05", "remaining_time": "0:02:59"}
2535
+ {"current_steps": 12675, "total_steps": 12698, "loss": 0.0674, "lr": 4.352915033090099e-10, "epoch": 6.987320837927233, "percentage": 99.82, "elapsed_time": "22:32:37", "remaining_time": "0:02:27"}
2536
+ {"current_steps": 12680, "total_steps": 12698, "loss": 0.1008, "lr": 2.728132733720301e-10, "epoch": 6.990077177508269, "percentage": 99.86, "elapsed_time": "22:33:36", "remaining_time": "0:01:55"}
2537
+ {"current_steps": 12685, "total_steps": 12698, "loss": 0.1177, "lr": 1.4812037989919702e-10, "epoch": 6.992833517089306, "percentage": 99.9, "elapsed_time": "22:34:19", "remaining_time": "0:01:23"}
2538
+ {"current_steps": 12690, "total_steps": 12698, "loss": 0.0691, "lr": 6.121305847317516e-11, "epoch": 6.995589856670342, "percentage": 99.94, "elapsed_time": "22:34:49", "remaining_time": "0:00:51"}
2539
+ {"current_steps": 12695, "total_steps": 12698, "loss": 0.0655, "lr": 1.2091473289288502e-11, "epoch": 6.998346196251378, "percentage": 99.98, "elapsed_time": "22:35:14", "remaining_time": "0:00:19"}
2540
+ {"current_steps": 12698, "total_steps": 12698, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "22:36:52", "remaining_time": "0:00:00"}