penfever commited on
Commit
fcc9877
·
verified ·
1 Parent(s): 74929a9

Training in progress, step 2800

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ed736d6f7c92193fa39105250ee8628785bbfa9fd8a82000f32ef4b4a2c8fa57
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57cf8c832c8a54a49888f27ca061dcf57391b41ee7a577a222e48d0d560973eb
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dee4905203c42052bb46534282464873266a6bb7f2fc7b489f148233f0399430
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:570d048abd985767ce4674ca60ca2524ad9eb472da4d6c92bd4109452bda7ba6
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2ade83710eaf6411840e40f7b437f965db33c59317c59ba5b55397aa58e6b6c5
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:955fcf9ef3b923d40ff7363874cfb2910ed0c2d31e04a7b20e14ee93c58a251f
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:06548d1dbed959b57a2ac7c173fa275ed9a5f8247ffec1ba599344b63db3a668
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:629f6a97321b5fb54b9809f62b406e6dde10e97580d36b31ac37d0ee4f94670d
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -521,3 +521,40 @@
521
  {"current_steps": 2605, "total_steps": 3850, "loss": 0.2136, "lr": 1.1461450545963167e-05, "epoch": 4.737033666969973, "percentage": 67.66, "elapsed_time": "17:26:28", "remaining_time": "8:20:08"}
522
  {"current_steps": 2610, "total_steps": 3850, "loss": 0.2093, "lr": 1.137955017082521e-05, "epoch": 4.746132848043676, "percentage": 67.79, "elapsed_time": "17:28:10", "remaining_time": "8:17:59"}
523
  {"current_steps": 2615, "total_steps": 3850, "loss": 0.2091, "lr": 1.1297826954377587e-05, "epoch": 4.755232029117379, "percentage": 67.92, "elapsed_time": "17:30:09", "remaining_time": "8:15:57"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
521
  {"current_steps": 2605, "total_steps": 3850, "loss": 0.2136, "lr": 1.1461450545963167e-05, "epoch": 4.737033666969973, "percentage": 67.66, "elapsed_time": "17:26:28", "remaining_time": "8:20:08"}
522
  {"current_steps": 2610, "total_steps": 3850, "loss": 0.2093, "lr": 1.137955017082521e-05, "epoch": 4.746132848043676, "percentage": 67.79, "elapsed_time": "17:28:10", "remaining_time": "8:17:59"}
523
  {"current_steps": 2615, "total_steps": 3850, "loss": 0.2091, "lr": 1.1297826954377587e-05, "epoch": 4.755232029117379, "percentage": 67.92, "elapsed_time": "17:30:09", "remaining_time": "8:15:57"}
524
+ {"current_steps": 2620, "total_steps": 3850, "loss": 0.2153, "lr": 1.1216282576112436e-05, "epoch": 4.764331210191083, "percentage": 68.05, "elapsed_time": "17:32:10", "remaining_time": "8:13:57"}
525
+ {"current_steps": 2625, "total_steps": 3850, "loss": 0.197, "lr": 1.1134918711846651e-05, "epoch": 4.773430391264786, "percentage": 68.18, "elapsed_time": "17:34:02", "remaining_time": "8:11:53"}
526
+ {"current_steps": 2630, "total_steps": 3850, "loss": 0.1997, "lr": 1.1053737033687346e-05, "epoch": 4.78252957233849, "percentage": 68.31, "elapsed_time": "17:36:20", "remaining_time": "8:10:00"}
527
+ {"current_steps": 2635, "total_steps": 3850, "loss": 0.2081, "lr": 1.097273920999757e-05, "epoch": 4.791628753412192, "percentage": 68.44, "elapsed_time": "17:38:06", "remaining_time": "8:07:53"}
528
+ {"current_steps": 2640, "total_steps": 3850, "loss": 0.206, "lr": 1.0891926905361948e-05, "epoch": 4.800727934485896, "percentage": 68.57, "elapsed_time": "17:40:17", "remaining_time": "8:05:57"}
529
+ {"current_steps": 2645, "total_steps": 3850, "loss": 0.2003, "lr": 1.081130178055251e-05, "epoch": 4.8098271155595995, "percentage": 68.7, "elapsed_time": "17:42:17", "remaining_time": "8:03:57"}
530
+ {"current_steps": 2650, "total_steps": 3850, "loss": 0.2025, "lr": 1.0730865492494593e-05, "epoch": 4.818926296633303, "percentage": 68.83, "elapsed_time": "17:44:25", "remaining_time": "8:02:00"}
531
+ {"current_steps": 2655, "total_steps": 3850, "loss": 0.197, "lr": 1.0650619694232704e-05, "epoch": 4.828025477707007, "percentage": 68.96, "elapsed_time": "17:46:19", "remaining_time": "7:59:56"}
532
+ {"current_steps": 2660, "total_steps": 3850, "loss": 0.2221, "lr": 1.057056603489665e-05, "epoch": 4.837124658780709, "percentage": 69.09, "elapsed_time": "17:48:18", "remaining_time": "7:57:55"}
533
+ {"current_steps": 2665, "total_steps": 3850, "loss": 0.2016, "lr": 1.0490706159667534e-05, "epoch": 4.846223839854413, "percentage": 69.22, "elapsed_time": "17:50:25", "remaining_time": "7:55:58"}
534
+ {"current_steps": 2670, "total_steps": 3850, "loss": 0.2155, "lr": 1.0411041709744063e-05, "epoch": 4.855323020928116, "percentage": 69.35, "elapsed_time": "17:52:14", "remaining_time": "7:53:52"}
535
+ {"current_steps": 2675, "total_steps": 3850, "loss": 0.2296, "lr": 1.0331574322308722e-05, "epoch": 4.86442220200182, "percentage": 69.48, "elapsed_time": "17:54:13", "remaining_time": "7:51:51"}
536
+ {"current_steps": 2680, "total_steps": 3850, "loss": 0.2154, "lr": 1.0252305630494201e-05, "epoch": 4.8735213830755235, "percentage": 69.61, "elapsed_time": "17:56:05", "remaining_time": "7:49:47"}
537
+ {"current_steps": 2685, "total_steps": 3850, "loss": 0.218, "lr": 1.0173237263349776e-05, "epoch": 4.882620564149226, "percentage": 69.74, "elapsed_time": "17:57:54", "remaining_time": "7:47:41"}
538
+ {"current_steps": 2690, "total_steps": 3850, "loss": 0.2072, "lr": 1.0094370845807857e-05, "epoch": 4.89171974522293, "percentage": 69.87, "elapsed_time": "17:59:51", "remaining_time": "7:45:39"}
539
+ {"current_steps": 2695, "total_steps": 3850, "loss": 0.2087, "lr": 1.001570799865061e-05, "epoch": 4.900818926296633, "percentage": 70.0, "elapsed_time": "18:01:48", "remaining_time": "7:43:37"}
540
+ {"current_steps": 2700, "total_steps": 3850, "loss": 0.2025, "lr": 9.937250338476607e-06, "epoch": 4.909918107370337, "percentage": 70.13, "elapsed_time": "18:03:55", "remaining_time": "7:41:40"}
541
+ {"current_steps": 2705, "total_steps": 3850, "loss": 0.2104, "lr": 9.858999477667656e-06, "epoch": 4.91901728844404, "percentage": 70.26, "elapsed_time": "18:05:45", "remaining_time": "7:39:35"}
542
+ {"current_steps": 2710, "total_steps": 3850, "loss": 0.2153, "lr": 9.780957024355591e-06, "epoch": 4.928116469517743, "percentage": 70.39, "elapsed_time": "18:07:39", "remaining_time": "7:37:32"}
543
+ {"current_steps": 2715, "total_steps": 3850, "loss": 0.2035, "lr": 9.703124582389312e-06, "epoch": 4.937215650591447, "percentage": 70.52, "elapsed_time": "18:09:42", "remaining_time": "7:35:33"}
544
+ {"current_steps": 2720, "total_steps": 3850, "loss": 0.2095, "lr": 9.62550375130175e-06, "epoch": 4.94631483166515, "percentage": 70.65, "elapsed_time": "18:11:53", "remaining_time": "7:33:36"}
545
+ {"current_steps": 2725, "total_steps": 3850, "loss": 0.2038, "lr": 9.548096126277058e-06, "epoch": 4.955414012738854, "percentage": 70.78, "elapsed_time": "18:13:44", "remaining_time": "7:31:32"}
546
+ {"current_steps": 2730, "total_steps": 3850, "loss": 0.2149, "lr": 9.470903298117744e-06, "epoch": 4.964513193812557, "percentage": 70.91, "elapsed_time": "18:15:36", "remaining_time": "7:29:28"}
547
+ {"current_steps": 2735, "total_steps": 3850, "loss": 0.222, "lr": 9.393926853212083e-06, "epoch": 4.97361237488626, "percentage": 71.04, "elapsed_time": "18:17:39", "remaining_time": "7:27:29"}
548
+ {"current_steps": 2740, "total_steps": 3850, "loss": 0.2098, "lr": 9.317168373501426e-06, "epoch": 4.9827115559599635, "percentage": 71.17, "elapsed_time": "18:19:56", "remaining_time": "7:25:35"}
549
+ {"current_steps": 2745, "total_steps": 3850, "loss": 0.2084, "lr": 9.240629436447752e-06, "epoch": 4.991810737033667, "percentage": 71.3, "elapsed_time": "18:22:00", "remaining_time": "7:23:36"}
550
+ {"current_steps": 2750, "total_steps": 3850, "loss": 0.1959, "lr": 9.164311615001202e-06, "epoch": 5.0, "percentage": 71.43, "elapsed_time": "18:24:03", "remaining_time": "7:21:37"}
551
+ {"current_steps": 2755, "total_steps": 3850, "loss": 0.1955, "lr": 9.08821647756778e-06, "epoch": 5.0090991810737036, "percentage": 71.56, "elapsed_time": "18:25:53", "remaining_time": "7:19:32"}
552
+ {"current_steps": 2760, "total_steps": 3850, "loss": 0.1922, "lr": 9.012345587977129e-06, "epoch": 5.018198362147407, "percentage": 71.69, "elapsed_time": "18:27:36", "remaining_time": "7:17:25"}
553
+ {"current_steps": 2765, "total_steps": 3850, "loss": 0.1846, "lr": 8.936700505450356e-06, "epoch": 5.02729754322111, "percentage": 71.82, "elapsed_time": "18:29:31", "remaining_time": "7:15:23"}
554
+ {"current_steps": 2770, "total_steps": 3850, "loss": 0.1956, "lr": 8.861282784568045e-06, "epoch": 5.036396724294813, "percentage": 71.95, "elapsed_time": "18:31:20", "remaining_time": "7:13:18"}
555
+ {"current_steps": 2775, "total_steps": 3850, "loss": 0.1828, "lr": 8.786093975238226e-06, "epoch": 5.045495905368517, "percentage": 72.08, "elapsed_time": "18:33:27", "remaining_time": "7:11:20"}
556
+ {"current_steps": 2780, "total_steps": 3850, "loss": 0.2025, "lr": 8.711135622664622e-06, "epoch": 5.05459508644222, "percentage": 72.21, "elapsed_time": "18:35:08", "remaining_time": "7:09:12"}
557
+ {"current_steps": 2785, "total_steps": 3850, "loss": 0.1969, "lr": 8.636409267314806e-06, "epoch": 5.063694267515924, "percentage": 72.34, "elapsed_time": "18:36:54", "remaining_time": "7:07:06"}
558
+ {"current_steps": 2790, "total_steps": 3850, "loss": 0.1865, "lr": 8.561916444888618e-06, "epoch": 5.072793448589627, "percentage": 72.47, "elapsed_time": "18:38:58", "remaining_time": "7:05:07"}
559
+ {"current_steps": 2795, "total_steps": 3850, "loss": 0.194, "lr": 8.487658686286533e-06, "epoch": 5.08189262966333, "percentage": 72.6, "elapsed_time": "18:41:09", "remaining_time": "7:03:11"}
560
+ {"current_steps": 2800, "total_steps": 3850, "loss": 0.1857, "lr": 8.413637517578246e-06, "epoch": 5.090991810737034, "percentage": 72.73, "elapsed_time": "18:43:13", "remaining_time": "7:01:12"}