penfever commited on
Commit
fc5d318
·
verified ·
1 Parent(s): 3b6ae42

Training in progress, step 3800

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:482cc5bbcfbdc24dadc1955b963343c6fa11cd521417fc52347837df4854c27a
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:461a26270b93360f792b578d982413ab4e28c6f9eb422485b2712dc922ed8603
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54bffe58fa88cc85eafa08f906657f26f7c797817203e45e86ef70a6a0fbfc9b
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2b868cfe84306e00f4660350e09c06ba73117c117040106d5ab276f851d0431b
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9466a594f72c6ad6f81f55c996ce5b08030169f37b766f2eff557ffc0f955b8c
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:33599e4453c8e46c9f9ee06ead06bd62821c13d3b7037950ef5279c72589495a
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:801db55c2d69fd2bc9f19869bf87ba47a8a2600830a52ad88aa2c6724655ed26
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d53caea4b87fd44d5a2ae27b283a8c42631266713ead623a06f61113ebb95dc1
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -721,3 +721,40 @@
721
  {"current_steps": 3605, "total_steps": 4340, "loss": 0.4028, "lr": 3.4030746282742455e-06, "epoch": 5.814516129032258, "percentage": 83.06, "elapsed_time": "17:46:04", "remaining_time": "3:37:21"}
722
  {"current_steps": 3610, "total_steps": 4340, "loss": 0.4404, "lr": 3.3583296966594904e-06, "epoch": 5.82258064516129, "percentage": 83.18, "elapsed_time": "17:47:40", "remaining_time": "3:35:54"}
723
  {"current_steps": 3615, "total_steps": 4340, "loss": 0.4129, "lr": 3.313853900927679e-06, "epoch": 5.830645161290323, "percentage": 83.29, "elapsed_time": "17:49:24", "remaining_time": "3:34:28"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
721
  {"current_steps": 3605, "total_steps": 4340, "loss": 0.4028, "lr": 3.4030746282742455e-06, "epoch": 5.814516129032258, "percentage": 83.06, "elapsed_time": "17:46:04", "remaining_time": "3:37:21"}
722
  {"current_steps": 3610, "total_steps": 4340, "loss": 0.4404, "lr": 3.3583296966594904e-06, "epoch": 5.82258064516129, "percentage": 83.18, "elapsed_time": "17:47:40", "remaining_time": "3:35:54"}
723
  {"current_steps": 3615, "total_steps": 4340, "loss": 0.4129, "lr": 3.313853900927679e-06, "epoch": 5.830645161290323, "percentage": 83.29, "elapsed_time": "17:49:24", "remaining_time": "3:34:28"}
724
+ {"current_steps": 3620, "total_steps": 4340, "loss": 0.4305, "lr": 3.269647960359532e-06, "epoch": 5.838709677419355, "percentage": 83.41, "elapsed_time": "17:50:52", "remaining_time": "3:32:59"}
725
+ {"current_steps": 3625, "total_steps": 4340, "loss": 0.4072, "lr": 3.2257125898715547e-06, "epoch": 5.846774193548387, "percentage": 83.53, "elapsed_time": "17:52:11", "remaining_time": "3:31:28"}
726
+ {"current_steps": 3630, "total_steps": 4340, "loss": 0.4111, "lr": 3.1820485000044867e-06, "epoch": 5.854838709677419, "percentage": 83.64, "elapsed_time": "17:54:06", "remaining_time": "3:30:05"}
727
+ {"current_steps": 3635, "total_steps": 4340, "loss": 0.4306, "lr": 3.1386563969118076e-06, "epoch": 5.862903225806452, "percentage": 83.76, "elapsed_time": "17:55:37", "remaining_time": "3:28:36"}
728
+ {"current_steps": 3640, "total_steps": 4340, "loss": 0.4537, "lr": 3.0955369823483173e-06, "epoch": 5.870967741935484, "percentage": 83.87, "elapsed_time": "17:57:00", "remaining_time": "3:27:06"}
729
+ {"current_steps": 3645, "total_steps": 4340, "loss": 0.4118, "lr": 3.0526909536587813e-06, "epoch": 5.879032258064516, "percentage": 83.99, "elapsed_time": "17:58:20", "remaining_time": "3:25:36"}
730
+ {"current_steps": 3650, "total_steps": 4340, "loss": 0.4488, "lr": 3.010119003766665e-06, "epoch": 5.887096774193548, "percentage": 84.1, "elapsed_time": "17:59:35", "remaining_time": "3:24:05"}
731
+ {"current_steps": 3655, "total_steps": 4340, "loss": 0.4214, "lr": 2.967821821162904e-06, "epoch": 5.895161290322581, "percentage": 84.22, "elapsed_time": "18:01:05", "remaining_time": "3:22:36"}
732
+ {"current_steps": 3660, "total_steps": 4340, "loss": 0.4144, "lr": 2.925800089894801e-06, "epoch": 5.903225806451613, "percentage": 84.33, "elapsed_time": "18:02:21", "remaining_time": "3:21:05"}
733
+ {"current_steps": 3665, "total_steps": 4340, "loss": 0.4032, "lr": 2.8840544895549396e-06, "epoch": 5.911290322580645, "percentage": 84.45, "elapsed_time": "18:03:59", "remaining_time": "3:19:38"}
734
+ {"current_steps": 3670, "total_steps": 4340, "loss": 0.4201, "lr": 2.8425856952702103e-06, "epoch": 5.919354838709677, "percentage": 84.56, "elapsed_time": "18:05:22", "remaining_time": "3:18:08"}
735
+ {"current_steps": 3675, "total_steps": 4340, "loss": 0.4181, "lr": 2.801394377690865e-06, "epoch": 5.92741935483871, "percentage": 84.68, "elapsed_time": "18:06:51", "remaining_time": "3:16:40"}
736
+ {"current_steps": 3680, "total_steps": 4340, "loss": 0.4264, "lr": 2.7604812029797057e-06, "epoch": 5.935483870967742, "percentage": 84.79, "elapsed_time": "18:08:20", "remaining_time": "3:15:11"}
737
+ {"current_steps": 3685, "total_steps": 4340, "loss": 0.4291, "lr": 2.719846832801287e-06, "epoch": 5.943548387096774, "percentage": 84.91, "elapsed_time": "18:09:45", "remaining_time": "3:13:42"}
738
+ {"current_steps": 3690, "total_steps": 4340, "loss": 0.422, "lr": 2.679491924311226e-06, "epoch": 5.951612903225806, "percentage": 85.02, "elapsed_time": "18:11:04", "remaining_time": "3:12:11"}
739
+ {"current_steps": 3695, "total_steps": 4340, "loss": 0.3934, "lr": 2.6394171301455717e-06, "epoch": 5.959677419354839, "percentage": 85.14, "elapsed_time": "18:12:28", "remaining_time": "3:10:42"}
740
+ {"current_steps": 3700, "total_steps": 4340, "loss": 0.41, "lr": 2.599623098410251e-06, "epoch": 5.967741935483871, "percentage": 85.25, "elapsed_time": "18:13:53", "remaining_time": "3:09:12"}
741
+ {"current_steps": 3705, "total_steps": 4340, "loss": 0.4189, "lr": 2.5601104726705737e-06, "epoch": 5.975806451612903, "percentage": 85.37, "elapsed_time": "18:15:13", "remaining_time": "3:07:42"}
742
+ {"current_steps": 3710, "total_steps": 4340, "loss": 0.423, "lr": 2.5208798919408527e-06, "epoch": 5.983870967741936, "percentage": 85.48, "elapsed_time": "18:16:40", "remaining_time": "3:06:13"}
743
+ {"current_steps": 3715, "total_steps": 4340, "loss": 0.4503, "lr": 2.481931990674047e-06, "epoch": 5.991935483870968, "percentage": 85.6, "elapsed_time": "18:18:17", "remaining_time": "3:04:46"}
744
+ {"current_steps": 3720, "total_steps": 4340, "loss": 0.4172, "lr": 2.4432673987515123e-06, "epoch": 6.0, "percentage": 85.71, "elapsed_time": "18:19:46", "remaining_time": "3:03:17"}
745
+ {"current_steps": 3725, "total_steps": 4340, "loss": 0.4207, "lr": 2.4048867414728004e-06, "epoch": 6.008064516129032, "percentage": 85.83, "elapsed_time": "18:21:29", "remaining_time": "3:01:51"}
746
+ {"current_steps": 3730, "total_steps": 4340, "loss": 0.4152, "lr": 2.3667906395455663e-06, "epoch": 6.016129032258065, "percentage": 85.94, "elapsed_time": "18:23:12", "remaining_time": "3:00:25"}
747
+ {"current_steps": 3735, "total_steps": 4340, "loss": 0.4091, "lr": 2.328979709075516e-06, "epoch": 6.024193548387097, "percentage": 86.06, "elapsed_time": "18:24:32", "remaining_time": "2:58:54"}
748
+ {"current_steps": 3740, "total_steps": 4340, "loss": 0.4024, "lr": 2.2914545615564454e-06, "epoch": 6.032258064516129, "percentage": 86.18, "elapsed_time": "18:25:55", "remaining_time": "2:57:25"}
749
+ {"current_steps": 3745, "total_steps": 4340, "loss": 0.3903, "lr": 2.254215803860351e-06, "epoch": 6.040322580645161, "percentage": 86.29, "elapsed_time": "18:27:29", "remaining_time": "2:55:57"}
750
+ {"current_steps": 3750, "total_steps": 4340, "loss": 0.3975, "lr": 2.2172640382276267e-06, "epoch": 6.048387096774194, "percentage": 86.41, "elapsed_time": "18:28:57", "remaining_time": "2:54:28"}
751
+ {"current_steps": 3755, "total_steps": 4340, "loss": 0.4168, "lr": 2.180599862257291e-06, "epoch": 6.056451612903226, "percentage": 86.52, "elapsed_time": "18:30:14", "remaining_time": "2:52:57"}
752
+ {"current_steps": 3760, "total_steps": 4340, "loss": 0.3806, "lr": 2.1442238688973682e-06, "epoch": 6.064516129032258, "percentage": 86.64, "elapsed_time": "18:31:54", "remaining_time": "2:51:31"}
753
+ {"current_steps": 3765, "total_steps": 4340, "loss": 0.4079, "lr": 2.1081366464352614e-06, "epoch": 6.07258064516129, "percentage": 86.75, "elapsed_time": "18:33:15", "remaining_time": "2:50:01"}
754
+ {"current_steps": 3770, "total_steps": 4340, "loss": 0.3761, "lr": 2.0723387784882674e-06, "epoch": 6.080645161290323, "percentage": 86.87, "elapsed_time": "18:34:49", "remaining_time": "2:48:33"}
755
+ {"current_steps": 3775, "total_steps": 4340, "loss": 0.4026, "lr": 2.036830843994102e-06, "epoch": 6.088709677419355, "percentage": 86.98, "elapsed_time": "18:36:18", "remaining_time": "2:47:04"}
756
+ {"current_steps": 3780, "total_steps": 4340, "loss": 0.3791, "lr": 2.0016134172015755e-06, "epoch": 6.096774193548387, "percentage": 87.1, "elapsed_time": "18:37:48", "remaining_time": "2:45:36"}
757
+ {"current_steps": 3785, "total_steps": 4340, "loss": 0.4162, "lr": 1.9666870676612883e-06, "epoch": 6.104838709677419, "percentage": 87.21, "elapsed_time": "18:39:10", "remaining_time": "2:44:06"}
758
+ {"current_steps": 3790, "total_steps": 4340, "loss": 0.3942, "lr": 1.9320523602164145e-06, "epoch": 6.112903225806452, "percentage": 87.33, "elapsed_time": "18:40:37", "remaining_time": "2:42:37"}
759
+ {"current_steps": 3795, "total_steps": 4340, "loss": 0.3981, "lr": 1.8977098549935745e-06, "epoch": 6.120967741935484, "percentage": 87.44, "elapsed_time": "18:41:56", "remaining_time": "2:41:07"}
760
+ {"current_steps": 3800, "total_steps": 4340, "loss": 0.3854, "lr": 1.8636601073937855e-06, "epoch": 6.129032258064516, "percentage": 87.56, "elapsed_time": "18:43:15", "remaining_time": "2:39:37"}