penfever commited on
Commit
9bd2fe6
·
verified ·
1 Parent(s): 5d63584

Training in progress, step 2800

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4ab1fdf0c413b4767720ea72da4ae766833afebf20ceabcb95e4d03539893361
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fe49fd9bd2f882588e602838b30971cf5694993272ecbfa2997126fd3193e8f
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:175e7c39a3a58d3534dbd5b3d915872099f444ae92df6060f7bbfee8304a1ddd
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0518aa0e7dfbded2bb0e3298a264a413c66628018a77033f9cf091e15c6dcae0
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bd9b22f36c96bb1697305c92cebbb2555d67992a962a95cac4cc101468ed60a6
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22867dbbd5cd67b827c3e180eab2a6621dbd322ed6d94f3049727cc0b06dee9b
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1e6f09391251382839f0daa2c342183fdbf92164643c2fb5a90ff0ef4c77bd7
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5732a9ec4ebde10fd74867c714367357318fa3f0472913239f1c9f1b323b8ac
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -522,3 +522,42 @@
522
  {"current_steps": 2610, "total_steps": 2814, "loss": 0.175, "lr": 6.434834189402716e-07, "epoch": 6.492537313432836, "percentage": 92.75, "elapsed_time": "5:17:13", "remaining_time": "0:24:47"}
523
  {"current_steps": 2615, "total_steps": 2814, "loss": 0.1819, "lr": 6.126360832905831e-07, "epoch": 6.5049751243781095, "percentage": 92.93, "elapsed_time": "5:17:47", "remaining_time": "0:24:10"}
524
  {"current_steps": 2620, "total_steps": 2814, "loss": 0.1779, "lr": 5.825349037875106e-07, "epoch": 6.517412935323383, "percentage": 93.11, "elapsed_time": "5:18:24", "remaining_time": "0:23:34"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
522
  {"current_steps": 2610, "total_steps": 2814, "loss": 0.175, "lr": 6.434834189402716e-07, "epoch": 6.492537313432836, "percentage": 92.75, "elapsed_time": "5:17:13", "remaining_time": "0:24:47"}
523
  {"current_steps": 2615, "total_steps": 2814, "loss": 0.1819, "lr": 6.126360832905831e-07, "epoch": 6.5049751243781095, "percentage": 92.93, "elapsed_time": "5:17:47", "remaining_time": "0:24:10"}
524
  {"current_steps": 2620, "total_steps": 2814, "loss": 0.1779, "lr": 5.825349037875106e-07, "epoch": 6.517412935323383, "percentage": 93.11, "elapsed_time": "5:18:24", "remaining_time": "0:23:34"}
525
+ {"current_steps": 2625, "total_steps": 2814, "loss": 0.1601, "lr": 5.531810389268732e-07, "epoch": 6.529850746268656, "percentage": 93.28, "elapsed_time": "5:18:59", "remaining_time": "0:22:58"}
526
+ {"current_steps": 2630, "total_steps": 2814, "loss": 0.1744, "lr": 5.245756184428041e-07, "epoch": 6.54228855721393, "percentage": 93.46, "elapsed_time": "5:19:36", "remaining_time": "0:22:21"}
527
+ {"current_steps": 2635, "total_steps": 2814, "loss": 0.176, "lr": 4.967197432642579e-07, "epoch": 6.554726368159204, "percentage": 93.64, "elapsed_time": "5:20:11", "remaining_time": "0:21:45"}
528
+ {"current_steps": 2640, "total_steps": 2814, "loss": 0.1765, "lr": 4.69614485472647e-07, "epoch": 6.567164179104478, "percentage": 93.82, "elapsed_time": "5:20:43", "remaining_time": "0:21:08"}
529
+ {"current_steps": 2645, "total_steps": 2814, "loss": 0.1724, "lr": 4.432608882605771e-07, "epoch": 6.579601990049751, "percentage": 93.99, "elapsed_time": "5:21:18", "remaining_time": "0:20:31"}
530
+ {"current_steps": 2650, "total_steps": 2814, "loss": 0.1807, "lr": 4.1765996589170353e-07, "epoch": 6.592039800995025, "percentage": 94.17, "elapsed_time": "5:21:57", "remaining_time": "0:19:55"}
531
+ {"current_steps": 2655, "total_steps": 2814, "loss": 0.1752, "lr": 3.928127036616869e-07, "epoch": 6.604477611940299, "percentage": 94.35, "elapsed_time": "5:22:32", "remaining_time": "0:19:18"}
532
+ {"current_steps": 2660, "total_steps": 2814, "loss": 0.1723, "lr": 3.687200578602812e-07, "epoch": 6.616915422885572, "percentage": 94.53, "elapsed_time": "5:23:11", "remaining_time": "0:18:42"}
533
+ {"current_steps": 2665, "total_steps": 2814, "loss": 0.1626, "lr": 3.453829557345212e-07, "epoch": 6.629353233830845, "percentage": 94.71, "elapsed_time": "5:23:43", "remaining_time": "0:18:05"}
534
+ {"current_steps": 2670, "total_steps": 2814, "loss": 0.1778, "lr": 3.228022954530463e-07, "epoch": 6.641791044776119, "percentage": 94.88, "elapsed_time": "5:24:10", "remaining_time": "0:17:29"}
535
+ {"current_steps": 2675, "total_steps": 2814, "loss": 0.1902, "lr": 3.009789460715218e-07, "epoch": 6.654228855721393, "percentage": 95.06, "elapsed_time": "5:24:40", "remaining_time": "0:16:52"}
536
+ {"current_steps": 2680, "total_steps": 2814, "loss": 0.1784, "lr": 2.799137474991942e-07, "epoch": 6.666666666666667, "percentage": 95.24, "elapsed_time": "5:25:17", "remaining_time": "0:16:15"}
537
+ {"current_steps": 2685, "total_steps": 2814, "loss": 0.1733, "lr": 2.5960751046657296e-07, "epoch": 6.67910447761194, "percentage": 95.42, "elapsed_time": "5:25:51", "remaining_time": "0:15:39"}
538
+ {"current_steps": 2690, "total_steps": 2814, "loss": 0.1679, "lr": 2.400610164942241e-07, "epoch": 6.691542288557214, "percentage": 95.59, "elapsed_time": "5:26:26", "remaining_time": "0:15:02"}
539
+ {"current_steps": 2695, "total_steps": 2814, "loss": 0.169, "lr": 2.2127501786268546e-07, "epoch": 6.703980099502488, "percentage": 95.77, "elapsed_time": "5:26:59", "remaining_time": "0:14:26"}
540
+ {"current_steps": 2700, "total_steps": 2814, "loss": 0.1741, "lr": 2.0325023758352545e-07, "epoch": 6.7164179104477615, "percentage": 95.95, "elapsed_time": "5:27:35", "remaining_time": "0:13:49"}
541
+ {"current_steps": 2705, "total_steps": 2814, "loss": 0.1756, "lr": 1.859873693715075e-07, "epoch": 6.7288557213930345, "percentage": 96.13, "elapsed_time": "5:28:11", "remaining_time": "0:13:13"}
542
+ {"current_steps": 2710, "total_steps": 2814, "loss": 0.1751, "lr": 1.6948707761789807e-07, "epoch": 6.741293532338308, "percentage": 96.3, "elapsed_time": "5:28:47", "remaining_time": "0:12:37"}
543
+ {"current_steps": 2715, "total_steps": 2814, "loss": 0.1703, "lr": 1.5374999736488927e-07, "epoch": 6.753731343283582, "percentage": 96.48, "elapsed_time": "5:29:23", "remaining_time": "0:12:00"}
544
+ {"current_steps": 2720, "total_steps": 2814, "loss": 0.179, "lr": 1.3877673428116302e-07, "epoch": 6.766169154228856, "percentage": 96.66, "elapsed_time": "5:30:02", "remaining_time": "0:11:24"}
545
+ {"current_steps": 2725, "total_steps": 2814, "loss": 0.1668, "lr": 1.245678646385784e-07, "epoch": 6.778606965174129, "percentage": 96.84, "elapsed_time": "5:30:37", "remaining_time": "0:10:47"}
546
+ {"current_steps": 2730, "total_steps": 2814, "loss": 0.1738, "lr": 1.1112393529000288e-07, "epoch": 6.791044776119403, "percentage": 97.01, "elapsed_time": "5:31:12", "remaining_time": "0:10:11"}
547
+ {"current_steps": 2735, "total_steps": 2814, "loss": 0.1721, "lr": 9.844546364824459e-08, "epoch": 6.803482587064677, "percentage": 97.19, "elapsed_time": "5:31:47", "remaining_time": "0:09:35"}
548
+ {"current_steps": 2740, "total_steps": 2814, "loss": 0.1702, "lr": 8.653293766615945e-08, "epoch": 6.8159203980099505, "percentage": 97.37, "elapsed_time": "5:32:22", "remaining_time": "0:08:58"}
549
+ {"current_steps": 2745, "total_steps": 2814, "loss": 0.176, "lr": 7.538681581785945e-08, "epoch": 6.8283582089552235, "percentage": 97.55, "elapsed_time": "5:32:57", "remaining_time": "0:08:22"}
550
+ {"current_steps": 2750, "total_steps": 2814, "loss": 0.1778, "lr": 6.50075270810735e-08, "epoch": 6.840796019900497, "percentage": 97.73, "elapsed_time": "5:33:37", "remaining_time": "0:07:45"}
551
+ {"current_steps": 2755, "total_steps": 2814, "loss": 0.1763, "lr": 5.539547092063391e-08, "epoch": 6.853233830845771, "percentage": 97.9, "elapsed_time": "5:34:11", "remaining_time": "0:07:09"}
552
+ {"current_steps": 2760, "total_steps": 2814, "loss": 0.168, "lr": 4.655101727310651e-08, "epoch": 6.865671641791045, "percentage": 98.08, "elapsed_time": "5:34:41", "remaining_time": "0:06:32"}
553
+ {"current_steps": 2765, "total_steps": 2814, "loss": 0.1831, "lr": 3.847450653254425e-08, "epoch": 6.878109452736318, "percentage": 98.26, "elapsed_time": "5:35:15", "remaining_time": "0:05:56"}
554
+ {"current_steps": 2770, "total_steps": 2814, "loss": 0.1747, "lr": 3.1166249537402104e-08, "epoch": 6.890547263681592, "percentage": 98.44, "elapsed_time": "5:35:51", "remaining_time": "0:05:20"}
555
+ {"current_steps": 2775, "total_steps": 2814, "loss": 0.1684, "lr": 2.4626527558551106e-08, "epoch": 6.902985074626866, "percentage": 98.61, "elapsed_time": "5:36:23", "remaining_time": "0:04:43"}
556
+ {"current_steps": 2780, "total_steps": 2814, "loss": 0.1753, "lr": 1.885559228847811e-08, "epoch": 6.91542288557214, "percentage": 98.79, "elapsed_time": "5:37:00", "remaining_time": "0:04:07"}
557
+ {"current_steps": 2785, "total_steps": 2814, "loss": 0.1767, "lr": 1.385366583158243e-08, "epoch": 6.927860696517413, "percentage": 98.97, "elapsed_time": "5:37:30", "remaining_time": "0:03:30"}
558
+ {"current_steps": 2790, "total_steps": 2814, "loss": 0.183, "lr": 9.620940695633797e-09, "epoch": 6.940298507462686, "percentage": 99.15, "elapsed_time": "5:38:03", "remaining_time": "0:02:54"}
559
+ {"current_steps": 2795, "total_steps": 2814, "loss": 0.1744, "lr": 6.15757978435827e-09, "epoch": 6.95273631840796, "percentage": 99.32, "elapsed_time": "5:38:41", "remaining_time": "0:02:18"}
560
+ {"current_steps": 2800, "total_steps": 2814, "loss": 0.1799, "lr": 3.463716391176597e-09, "epoch": 6.965174129353234, "percentage": 99.5, "elapsed_time": "5:39:18", "remaining_time": "0:01:41"}
561
+ {"current_steps": 2805, "total_steps": 2814, "loss": 0.1691, "lr": 1.5394541940705332e-09, "epoch": 6.977611940298507, "percentage": 99.68, "elapsed_time": "5:40:53", "remaining_time": "0:01:05"}
562
+ {"current_steps": 2810, "total_steps": 2814, "loss": 0.1735, "lr": 3.848672515882612e-10, "epoch": 6.990049751243781, "percentage": 99.86, "elapsed_time": "5:41:27", "remaining_time": "0:00:29"}
563
+ {"current_steps": 2814, "total_steps": 2814, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "5:42:31", "remaining_time": "0:00:00"}