penfever commited on
Commit
5d5a8ed
·
verified ·
1 Parent(s): 4f84be0

Training in progress, step 3752

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b072d70b85be7646f7c771ae94c05893ed00a165c4dcd87ce37cf50e2312bced
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ebf20cd4913d818e2968a235d5bcc18d45ad3778efc115ec7e0a5605cdc4576
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:11f3a9b511268a9ed8ee2963a1c076d749fc9c24703249d34789b63b430cd0a4
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07682ac7a74c482cb3d8773e23ced05281e1871ad1dc98b9d7201e94f4669ee6
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b2d2e4042770f75a970d5480d44f4b3e9266e5e90579a4668bcb855a901015b
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b0b3eb72e68f2b1de79f236577ed2fcada7ea1d8a1bd9077688ba159ee43dc02
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3cd9154a5a3386b31a2e2568e320d916d70372cf3e6b8b58d8867ce92244b52f
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1756c7ee76fcef884196eb6483affce9a878daab832fafb7be57cee37bbd8bc6
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -719,3 +719,33 @@
719
  {"current_steps": 3595, "total_steps": 3752, "loss": 0.1944, "lr": 2.157876237211487e-07, "epoch": 6.707749766573296, "percentage": 95.82, "elapsed_time": "1 day, 2:27:20", "remaining_time": "1:09:19"}
720
  {"current_steps": 3600, "total_steps": 3752, "loss": 0.1948, "lr": 2.0236899311970593e-07, "epoch": 6.717086834733894, "percentage": 95.95, "elapsed_time": "1 day, 2:29:30", "remaining_time": "1:07:06"}
721
  {"current_steps": 3605, "total_steps": 3752, "loss": 0.2016, "lr": 1.8937895773529114e-07, "epoch": 6.726423902894491, "percentage": 96.08, "elapsed_time": "1 day, 2:32:39", "remaining_time": "1:04:56"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
719
  {"current_steps": 3595, "total_steps": 3752, "loss": 0.1944, "lr": 2.157876237211487e-07, "epoch": 6.707749766573296, "percentage": 95.82, "elapsed_time": "1 day, 2:27:20", "remaining_time": "1:09:19"}
720
  {"current_steps": 3600, "total_steps": 3752, "loss": 0.1948, "lr": 2.0236899311970593e-07, "epoch": 6.717086834733894, "percentage": 95.95, "elapsed_time": "1 day, 2:29:30", "remaining_time": "1:07:06"}
721
  {"current_steps": 3605, "total_steps": 3752, "loss": 0.2016, "lr": 1.8937895773529114e-07, "epoch": 6.726423902894491, "percentage": 96.08, "elapsed_time": "1 day, 2:32:39", "remaining_time": "1:04:56"}
722
+ {"current_steps": 3610, "total_steps": 3752, "loss": 0.1939, "lr": 1.7681779878675697e-07, "epoch": 6.735760971055089, "percentage": 96.22, "elapsed_time": "1 day, 2:34:33", "remaining_time": "1:02:43"}
723
+ {"current_steps": 3615, "total_steps": 3752, "loss": 0.1988, "lr": 1.646857882082853e-07, "epoch": 6.745098039215686, "percentage": 96.35, "elapsed_time": "1 day, 2:36:50", "remaining_time": "1:00:30"}
724
+ {"current_steps": 3620, "total_steps": 3752, "loss": 0.1981, "lr": 1.5298318864350738e-07, "epoch": 6.754435107376284, "percentage": 96.48, "elapsed_time": "1 day, 2:38:52", "remaining_time": "0:58:18"}
725
+ {"current_steps": 3625, "total_steps": 3752, "loss": 0.2008, "lr": 1.417102534398196e-07, "epoch": 6.763772175536881, "percentage": 96.62, "elapsed_time": "1 day, 2:41:03", "remaining_time": "0:56:05"}
726
+ {"current_steps": 3630, "total_steps": 3752, "loss": 0.1871, "lr": 1.3086722664288787e-07, "epoch": 6.773109243697479, "percentage": 96.75, "elapsed_time": "1 day, 2:43:27", "remaining_time": "0:53:53"}
727
+ {"current_steps": 3635, "total_steps": 3752, "loss": 0.2013, "lr": 1.2045434299137403e-07, "epoch": 6.7824463118580764, "percentage": 96.88, "elapsed_time": "1 day, 2:45:22", "remaining_time": "0:51:40"}
728
+ {"current_steps": 3640, "total_steps": 3752, "loss": 0.199, "lr": 1.1047182791185551e-07, "epoch": 6.791783380018674, "percentage": 97.01, "elapsed_time": "1 day, 2:47:27", "remaining_time": "0:49:27"}
729
+ {"current_steps": 3645, "total_steps": 3752, "loss": 0.2022, "lr": 1.0091989751393583e-07, "epoch": 6.8011204481792715, "percentage": 97.15, "elapsed_time": "1 day, 2:49:35", "remaining_time": "0:47:14"}
730
+ {"current_steps": 3650, "total_steps": 3752, "loss": 0.1971, "lr": 9.179875858557285e-08, "epoch": 6.810457516339869, "percentage": 97.28, "elapsed_time": "1 day, 2:51:46", "remaining_time": "0:45:02"}
731
+ {"current_steps": 3655, "total_steps": 3752, "loss": 0.2001, "lr": 8.310860858859793e-08, "epoch": 6.819794584500467, "percentage": 97.41, "elapsed_time": "1 day, 2:53:59", "remaining_time": "0:42:50"}
732
+ {"current_steps": 3660, "total_steps": 3752, "loss": 0.1893, "lr": 7.484963565444813e-08, "epoch": 6.829131652661064, "percentage": 97.55, "elapsed_time": "1 day, 2:56:20", "remaining_time": "0:40:37"}
733
+ {"current_steps": 3665, "total_steps": 3752, "loss": 0.201, "lr": 6.702201858008517e-08, "epoch": 6.838468720821662, "percentage": 97.68, "elapsed_time": "1 day, 2:58:17", "remaining_time": "0:38:24"}
734
+ {"current_steps": 3670, "total_steps": 3752, "loss": 0.1886, "lr": 5.962592682412948e-08, "epoch": 6.847805788982259, "percentage": 97.81, "elapsed_time": "1 day, 3:00:40", "remaining_time": "0:36:12"}
735
+ {"current_steps": 3675, "total_steps": 3752, "loss": 0.2023, "lr": 5.2661520503192176e-08, "epoch": 6.857142857142857, "percentage": 97.95, "elapsed_time": "1 day, 3:02:31", "remaining_time": "0:33:59"}
736
+ {"current_steps": 3680, "total_steps": 3752, "loss": 0.1944, "lr": 4.612895038840215e-08, "epoch": 6.866479925303455, "percentage": 98.08, "elapsed_time": "1 day, 3:04:31", "remaining_time": "0:31:47"}
737
+ {"current_steps": 3685, "total_steps": 3752, "loss": 0.1936, "lr": 4.0028357902153204e-08, "epoch": 6.875816993464053, "percentage": 98.21, "elapsed_time": "1 day, 3:06:52", "remaining_time": "0:29:34"}
738
+ {"current_steps": 3690, "total_steps": 3752, "loss": 0.1922, "lr": 3.435987511503314e-08, "epoch": 6.88515406162465, "percentage": 98.35, "elapsed_time": "1 day, 3:09:05", "remaining_time": "0:27:22"}
739
+ {"current_steps": 3695, "total_steps": 3752, "loss": 0.2045, "lr": 2.9123624742963818e-08, "epoch": 6.894491129785248, "percentage": 98.48, "elapsed_time": "1 day, 3:11:21", "remaining_time": "0:25:09"}
740
+ {"current_steps": 3700, "total_steps": 3752, "loss": 0.1931, "lr": 2.4319720144554417e-08, "epoch": 6.903828197945845, "percentage": 98.61, "elapsed_time": "1 day, 3:13:37", "remaining_time": "0:22:57"}
741
+ {"current_steps": 3705, "total_steps": 3752, "loss": 0.1893, "lr": 1.9948265318638915e-08, "epoch": 6.913165266106443, "percentage": 98.75, "elapsed_time": "1 day, 3:15:54", "remaining_time": "0:20:45"}
742
+ {"current_steps": 3710, "total_steps": 3752, "loss": 0.1926, "lr": 1.6009354902024598e-08, "epoch": 6.92250233426704, "percentage": 98.88, "elapsed_time": "1 day, 3:18:11", "remaining_time": "0:18:32"}
743
+ {"current_steps": 3715, "total_steps": 3752, "loss": 0.191, "lr": 1.2503074167451445e-08, "epoch": 6.931839402427638, "percentage": 99.01, "elapsed_time": "1 day, 3:20:28", "remaining_time": "0:16:20"}
744
+ {"current_steps": 3720, "total_steps": 3752, "loss": 0.2063, "lr": 9.429499021731403e-09, "epoch": 6.9411764705882355, "percentage": 99.15, "elapsed_time": "1 day, 3:22:44", "remaining_time": "0:14:07"}
745
+ {"current_steps": 3725, "total_steps": 3752, "loss": 0.2042, "lr": 6.788696004120798e-09, "epoch": 6.950513538748833, "percentage": 99.28, "elapsed_time": "1 day, 3:24:58", "remaining_time": "0:11:55"}
746
+ {"current_steps": 3730, "total_steps": 3752, "loss": 0.1949, "lr": 4.580722284872608e-09, "epoch": 6.959850606909431, "percentage": 99.41, "elapsed_time": "1 day, 3:27:10", "remaining_time": "0:09:42"}
747
+ {"current_steps": 3735, "total_steps": 3752, "loss": 0.1942, "lr": 2.8056256639974467e-09, "epoch": 6.969187675070028, "percentage": 99.55, "elapsed_time": "1 day, 3:29:43", "remaining_time": "0:07:30"}
748
+ {"current_steps": 3740, "total_steps": 3752, "loss": 0.1862, "lr": 1.4634445702288446e-09, "epoch": 6.978524743230626, "percentage": 99.68, "elapsed_time": "1 day, 3:32:09", "remaining_time": "0:05:18"}
749
+ {"current_steps": 3745, "total_steps": 3752, "loss": 0.1915, "lr": 5.542080601950161e-10, "epoch": 6.987861811391223, "percentage": 99.81, "elapsed_time": "1 day, 3:34:21", "remaining_time": "0:03:05"}
750
+ {"current_steps": 3750, "total_steps": 3752, "loss": 0.1889, "lr": 7.793581778825499e-11, "epoch": 6.997198879551821, "percentage": 99.95, "elapsed_time": "1 day, 3:36:27", "remaining_time": "0:00:53"}
751
+ {"current_steps": 3752, "total_steps": 3752, "epoch": 7.0, "percentage": 100.0, "elapsed_time": "1 day, 3:38:13", "remaining_time": "0:00:00"}