penfever commited on
Commit
a5dc658
·
verified ·
1 Parent(s): fc5d318

Training in progress, step 4000

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:461a26270b93360f792b578d982413ab4e28c6f9eb422485b2712dc922ed8603
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db2935fd1318902c4a052f0467c2e3e4c7aa51791601fe389c51e62b442e8fab
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2b868cfe84306e00f4660350e09c06ba73117c117040106d5ab276f851d0431b
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:977fa1a86b8ac74040c4c9f976af3d2a3525d0f982d7de11db6900846354295f
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33599e4453c8e46c9f9ee06ead06bd62821c13d3b7037950ef5279c72589495a
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6065ec1e5b9949cb07938e371dbdda05d05a8738933f473e3790bfc171e464f4
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d53caea4b87fd44d5a2ae27b283a8c42631266713ead623a06f61113ebb95dc1
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:274d378441b3c556d829cc65f798fe38a9eea4f78339e26cc05047c1c2a4e21c
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -758,3 +758,43 @@
758
  {"current_steps": 3790, "total_steps": 4340, "loss": 0.3942, "lr": 1.9320523602164145e-06, "epoch": 6.112903225806452, "percentage": 87.33, "elapsed_time": "18:40:37", "remaining_time": "2:42:37"}
759
  {"current_steps": 3795, "total_steps": 4340, "loss": 0.3981, "lr": 1.8977098549935745e-06, "epoch": 6.120967741935484, "percentage": 87.44, "elapsed_time": "18:41:56", "remaining_time": "2:41:07"}
760
  {"current_steps": 3800, "total_steps": 4340, "loss": 0.3854, "lr": 1.8636601073937855e-06, "epoch": 6.129032258064516, "percentage": 87.56, "elapsed_time": "18:43:15", "remaining_time": "2:39:37"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
758
  {"current_steps": 3790, "total_steps": 4340, "loss": 0.3942, "lr": 1.9320523602164145e-06, "epoch": 6.112903225806452, "percentage": 87.33, "elapsed_time": "18:40:37", "remaining_time": "2:42:37"}
759
  {"current_steps": 3795, "total_steps": 4340, "loss": 0.3981, "lr": 1.8977098549935745e-06, "epoch": 6.120967741935484, "percentage": 87.44, "elapsed_time": "18:41:56", "remaining_time": "2:41:07"}
760
  {"current_steps": 3800, "total_steps": 4340, "loss": 0.3854, "lr": 1.8636601073937855e-06, "epoch": 6.129032258064516, "percentage": 87.56, "elapsed_time": "18:43:15", "remaining_time": "2:39:37"}
761
+ {"current_steps": 3805, "total_steps": 4340, "loss": 0.4063, "lr": 1.8299036680834459e-06, "epoch": 6.137096774193548, "percentage": 87.67, "elapsed_time": "18:46:13", "remaining_time": "2:38:21"}
762
+ {"current_steps": 3810, "total_steps": 4340, "loss": 0.4216, "lr": 1.796441082985476e-06, "epoch": 6.145161290322581, "percentage": 87.79, "elapsed_time": "18:47:30", "remaining_time": "2:36:50"}
763
+ {"current_steps": 3815, "total_steps": 4340, "loss": 0.3907, "lr": 1.763272893270458e-06, "epoch": 6.153225806451613, "percentage": 87.9, "elapsed_time": "18:49:01", "remaining_time": "2:35:22"}
764
+ {"current_steps": 3820, "total_steps": 4340, "loss": 0.4245, "lr": 1.7303996353478837e-06, "epoch": 6.161290322580645, "percentage": 88.02, "elapsed_time": "18:50:20", "remaining_time": "2:33:52"}
765
+ {"current_steps": 3825, "total_steps": 4340, "loss": 0.402, "lr": 1.6978218408574943e-06, "epoch": 6.169354838709677, "percentage": 88.13, "elapsed_time": "18:51:52", "remaining_time": "2:32:23"}
766
+ {"current_steps": 3830, "total_steps": 4340, "loss": 0.3877, "lr": 1.6655400366606867e-06, "epoch": 6.17741935483871, "percentage": 88.25, "elapsed_time": "18:53:13", "remaining_time": "2:30:53"}
767
+ {"current_steps": 3835, "total_steps": 4340, "loss": 0.3828, "lr": 1.6335547448319622e-06, "epoch": 6.185483870967742, "percentage": 88.36, "elapsed_time": "18:54:43", "remaining_time": "2:29:25"}
768
+ {"current_steps": 3840, "total_steps": 4340, "loss": 0.4247, "lr": 1.6018664826505114e-06, "epoch": 6.193548387096774, "percentage": 88.48, "elapsed_time": "18:55:53", "remaining_time": "2:27:54"}
769
+ {"current_steps": 3845, "total_steps": 4340, "loss": 0.4036, "lr": 1.5704757625918454e-06, "epoch": 6.201612903225806, "percentage": 88.59, "elapsed_time": "18:57:12", "remaining_time": "2:26:24"}
770
+ {"current_steps": 3850, "total_steps": 4340, "loss": 0.3976, "lr": 1.539383092319502e-06, "epoch": 6.209677419354839, "percentage": 88.71, "elapsed_time": "18:58:44", "remaining_time": "2:24:55"}
771
+ {"current_steps": 3855, "total_steps": 4340, "loss": 0.4257, "lr": 1.5085889746768211e-06, "epoch": 6.217741935483871, "percentage": 88.82, "elapsed_time": "19:00:07", "remaining_time": "2:23:26"}
772
+ {"current_steps": 3860, "total_steps": 4340, "loss": 0.3887, "lr": 1.478093907678848e-06, "epoch": 6.225806451612903, "percentage": 88.94, "elapsed_time": "19:01:37", "remaining_time": "2:21:57"}
773
+ {"current_steps": 3865, "total_steps": 4340, "loss": 0.3999, "lr": 1.4478983845042493e-06, "epoch": 6.233870967741935, "percentage": 89.06, "elapsed_time": "19:03:11", "remaining_time": "2:20:29"}
774
+ {"current_steps": 3870, "total_steps": 4340, "loss": 0.3886, "lr": 1.4180028934873402e-06, "epoch": 6.241935483870968, "percentage": 89.17, "elapsed_time": "19:04:27", "remaining_time": "2:18:59"}
775
+ {"current_steps": 3875, "total_steps": 4340, "loss": 0.4086, "lr": 1.3884079181102062e-06, "epoch": 6.25, "percentage": 89.29, "elapsed_time": "19:05:58", "remaining_time": "2:17:30"}
776
+ {"current_steps": 3880, "total_steps": 4340, "loss": 0.4153, "lr": 1.3591139369948692e-06, "epoch": 6.258064516129032, "percentage": 89.4, "elapsed_time": "19:07:20", "remaining_time": "2:16:01"}
777
+ {"current_steps": 3885, "total_steps": 4340, "loss": 0.3946, "lr": 1.3301214238955384e-06, "epoch": 6.266129032258064, "percentage": 89.52, "elapsed_time": "19:08:38", "remaining_time": "2:14:31"}
778
+ {"current_steps": 3890, "total_steps": 4340, "loss": 0.3823, "lr": 1.3014308476909698e-06, "epoch": 6.274193548387097, "percentage": 89.63, "elapsed_time": "19:09:57", "remaining_time": "2:13:01"}
779
+ {"current_steps": 3895, "total_steps": 4340, "loss": 0.4207, "lr": 1.2730426723768673e-06, "epoch": 6.282258064516129, "percentage": 89.75, "elapsed_time": "19:11:15", "remaining_time": "2:11:31"}
780
+ {"current_steps": 3900, "total_steps": 4340, "loss": 0.3986, "lr": 1.244957357058394e-06, "epoch": 6.290322580645161, "percentage": 89.86, "elapsed_time": "19:12:41", "remaining_time": "2:10:02"}
781
+ {"current_steps": 3905, "total_steps": 4340, "loss": 0.4153, "lr": 1.2171753559427168e-06, "epoch": 6.298387096774194, "percentage": 89.98, "elapsed_time": "19:14:05", "remaining_time": "2:08:33"}
782
+ {"current_steps": 3910, "total_steps": 4340, "loss": 0.4061, "lr": 1.189697118331703e-06, "epoch": 6.306451612903226, "percentage": 90.09, "elapsed_time": "19:15:29", "remaining_time": "2:07:04"}
783
+ {"current_steps": 3915, "total_steps": 4340, "loss": 0.3981, "lr": 1.1625230886146245e-06, "epoch": 6.314516129032258, "percentage": 90.21, "elapsed_time": "19:16:51", "remaining_time": "2:05:35"}
784
+ {"current_steps": 3920, "total_steps": 4340, "loss": 0.4337, "lr": 1.1356537062609706e-06, "epoch": 6.32258064516129, "percentage": 90.32, "elapsed_time": "19:18:25", "remaining_time": "2:04:07"}
785
+ {"current_steps": 3925, "total_steps": 4340, "loss": 0.4229, "lr": 1.109089405813366e-06, "epoch": 6.330645161290323, "percentage": 90.44, "elapsed_time": "19:19:43", "remaining_time": "2:02:37"}
786
+ {"current_steps": 3930, "total_steps": 4340, "loss": 0.4088, "lr": 1.0828306168805148e-06, "epoch": 6.338709677419355, "percentage": 90.55, "elapsed_time": "19:21:01", "remaining_time": "2:01:07"}
787
+ {"current_steps": 3935, "total_steps": 4340, "loss": 0.4003, "lr": 1.0568777641302663e-06, "epoch": 6.346774193548387, "percentage": 90.67, "elapsed_time": "19:22:38", "remaining_time": "1:59:39"}
788
+ {"current_steps": 3940, "total_steps": 4340, "loss": 0.4068, "lr": 1.0312312672827417e-06, "epoch": 6.354838709677419, "percentage": 90.78, "elapsed_time": "19:24:02", "remaining_time": "1:58:10"}
789
+ {"current_steps": 3945, "total_steps": 4340, "loss": 0.4069, "lr": 1.0058915411035586e-06, "epoch": 6.362903225806452, "percentage": 90.9, "elapsed_time": "19:25:38", "remaining_time": "1:56:42"}
790
+ {"current_steps": 3950, "total_steps": 4340, "loss": 0.4111, "lr": 9.808589953971092e-07, "epoch": 6.370967741935484, "percentage": 91.01, "elapsed_time": "19:27:03", "remaining_time": "1:55:13"}
791
+ {"current_steps": 3955, "total_steps": 4340, "loss": 0.4014, "lr": 9.561340349999315e-07, "epoch": 6.379032258064516, "percentage": 91.13, "elapsed_time": "19:28:25", "remaining_time": "1:53:44"}
792
+ {"current_steps": 3960, "total_steps": 4340, "loss": 0.4091, "lr": 9.317170597741798e-07, "epoch": 6.387096774193548, "percentage": 91.24, "elapsed_time": "19:29:55", "remaining_time": "1:52:15"}
793
+ {"current_steps": 3965, "total_steps": 4340, "loss": 0.3971, "lr": 9.076084646011418e-07, "epoch": 6.395161290322581, "percentage": 91.36, "elapsed_time": "19:31:41", "remaining_time": "1:50:48"}
794
+ {"current_steps": 3970, "total_steps": 4340, "loss": 0.4087, "lr": 8.83808639374848e-07, "epoch": 6.403225806451613, "percentage": 91.47, "elapsed_time": "19:33:06", "remaining_time": "1:49:19"}
795
+ {"current_steps": 3975, "total_steps": 4340, "loss": 0.3997, "lr": 8.60317968995792e-07, "epoch": 6.411290322580645, "percentage": 91.59, "elapsed_time": "19:34:26", "remaining_time": "1:47:50"}
796
+ {"current_steps": 3980, "total_steps": 4340, "loss": 0.4111, "lr": 8.371368333646823e-07, "epoch": 6.419354838709677, "percentage": 91.71, "elapsed_time": "19:36:06", "remaining_time": "1:46:22"}
797
+ {"current_steps": 3985, "total_steps": 4340, "loss": 0.4208, "lr": 8.142656073762944e-07, "epoch": 6.42741935483871, "percentage": 91.82, "elapsed_time": "19:37:27", "remaining_time": "1:44:53"}
798
+ {"current_steps": 3990, "total_steps": 4340, "loss": 0.4159, "lr": 7.917046609134349e-07, "epoch": 6.435483870967742, "percentage": 91.94, "elapsed_time": "19:38:54", "remaining_time": "1:43:24"}
799
+ {"current_steps": 3995, "total_steps": 4340, "loss": 0.3988, "lr": 7.694543588409353e-07, "epoch": 6.443548387096774, "percentage": 92.05, "elapsed_time": "19:40:22", "remaining_time": "1:41:56"}
800
+ {"current_steps": 4000, "total_steps": 4340, "loss": 0.4034, "lr": 7.475150609997595e-07, "epoch": 6.451612903225806, "percentage": 92.17, "elapsed_time": "19:41:45", "remaining_time": "1:40:26"}