penfever commited on
Commit
2b0b255
·
verified ·
1 Parent(s): a5dc658

Training in progress, step 4200

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db2935fd1318902c4a052f0467c2e3e4c7aa51791601fe389c51e62b442e8fab
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed7cce06ee07229fbcc4622d2d0e097f1190f5b645121d87324e44835ba7a78c
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:977fa1a86b8ac74040c4c9f976af3d2a3525d0f982d7de11db6900846354295f
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3dcbf1835b3c5e01c8d58d794c2aaabadbc62d65657ef2a5080f1a86e8de4114
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6065ec1e5b9949cb07938e371dbdda05d05a8738933f473e3790bfc171e464f4
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b7364ca6b88e4c3f515e18a615b36f1347c71a1779366f0b6ba1dcc975abd307
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:274d378441b3c556d829cc65f798fe38a9eea4f78339e26cc05047c1c2a4e21c
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dda4a4f93c431cdc75e5ffb7deb88ba7ee10fbbc8e66fd6ce38455d4d664732
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -798,3 +798,43 @@
798
  {"current_steps": 3990, "total_steps": 4340, "loss": 0.4159, "lr": 7.917046609134349e-07, "epoch": 6.435483870967742, "percentage": 91.94, "elapsed_time": "19:38:54", "remaining_time": "1:43:24"}
799
  {"current_steps": 3995, "total_steps": 4340, "loss": 0.3988, "lr": 7.694543588409353e-07, "epoch": 6.443548387096774, "percentage": 92.05, "elapsed_time": "19:40:22", "remaining_time": "1:41:56"}
800
  {"current_steps": 4000, "total_steps": 4340, "loss": 0.4034, "lr": 7.475150609997595e-07, "epoch": 6.451612903225806, "percentage": 92.17, "elapsed_time": "19:41:45", "remaining_time": "1:40:26"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
798
  {"current_steps": 3990, "total_steps": 4340, "loss": 0.4159, "lr": 7.917046609134349e-07, "epoch": 6.435483870967742, "percentage": 91.94, "elapsed_time": "19:38:54", "remaining_time": "1:43:24"}
799
  {"current_steps": 3995, "total_steps": 4340, "loss": 0.3988, "lr": 7.694543588409353e-07, "epoch": 6.443548387096774, "percentage": 92.05, "elapsed_time": "19:40:22", "remaining_time": "1:41:56"}
800
  {"current_steps": 4000, "total_steps": 4340, "loss": 0.4034, "lr": 7.475150609997595e-07, "epoch": 6.451612903225806, "percentage": 92.17, "elapsed_time": "19:41:45", "remaining_time": "1:40:26"}
801
+ {"current_steps": 4005, "total_steps": 4340, "loss": 0.3992, "lr": 7.258871222011832e-07, "epoch": 6.459677419354839, "percentage": 92.28, "elapsed_time": "19:45:32", "remaining_time": "1:39:09"}
802
+ {"current_steps": 4010, "total_steps": 4340, "loss": 0.408, "lr": 7.045708922210615e-07, "epoch": 6.467741935483871, "percentage": 92.4, "elapsed_time": "19:46:52", "remaining_time": "1:37:40"}
803
+ {"current_steps": 4015, "total_steps": 4340, "loss": 0.3973, "lr": 6.835667157941594e-07, "epoch": 6.475806451612903, "percentage": 92.51, "elapsed_time": "19:48:15", "remaining_time": "1:36:11"}
804
+ {"current_steps": 4020, "total_steps": 4340, "loss": 0.4175, "lr": 6.628749326085926e-07, "epoch": 6.483870967741936, "percentage": 92.63, "elapsed_time": "19:49:42", "remaining_time": "1:34:42"}
805
+ {"current_steps": 4025, "total_steps": 4340, "loss": 0.3904, "lr": 6.424958773003198e-07, "epoch": 6.491935483870968, "percentage": 92.74, "elapsed_time": "19:51:09", "remaining_time": "1:33:13"}
806
+ {"current_steps": 4030, "total_steps": 4340, "loss": 0.4108, "lr": 6.224298794477434e-07, "epoch": 6.5, "percentage": 92.86, "elapsed_time": "19:52:38", "remaining_time": "1:31:44"}
807
+ {"current_steps": 4035, "total_steps": 4340, "loss": 0.4106, "lr": 6.026772635663647e-07, "epoch": 6.508064516129032, "percentage": 92.97, "elapsed_time": "19:53:57", "remaining_time": "1:30:15"}
808
+ {"current_steps": 4040, "total_steps": 4340, "loss": 0.4045, "lr": 5.832383491035499e-07, "epoch": 6.516129032258064, "percentage": 93.09, "elapsed_time": "19:55:31", "remaining_time": "1:28:46"}
809
+ {"current_steps": 4045, "total_steps": 4340, "loss": 0.3993, "lr": 5.641134504333546e-07, "epoch": 6.524193548387097, "percentage": 93.2, "elapsed_time": "19:57:03", "remaining_time": "1:27:18"}
810
+ {"current_steps": 4050, "total_steps": 4340, "loss": 0.4128, "lr": 5.453028768514457e-07, "epoch": 6.532258064516129, "percentage": 93.32, "elapsed_time": "19:58:17", "remaining_time": "1:25:48"}
811
+ {"current_steps": 4055, "total_steps": 4340, "loss": 0.4039, "lr": 5.268069325700942e-07, "epoch": 6.540322580645161, "percentage": 93.43, "elapsed_time": "19:59:45", "remaining_time": "1:24:19"}
812
+ {"current_steps": 4060, "total_steps": 4340, "loss": 0.4197, "lr": 5.08625916713259e-07, "epoch": 6.548387096774194, "percentage": 93.55, "elapsed_time": "20:01:04", "remaining_time": "1:22:49"}
813
+ {"current_steps": 4065, "total_steps": 4340, "loss": 0.415, "lr": 4.907601233117465e-07, "epoch": 6.556451612903226, "percentage": 93.66, "elapsed_time": "20:02:21", "remaining_time": "1:21:20"}
814
+ {"current_steps": 4070, "total_steps": 4340, "loss": 0.3936, "lr": 4.732098412984565e-07, "epoch": 6.564516129032258, "percentage": 93.78, "elapsed_time": "20:03:41", "remaining_time": "1:19:51"}
815
+ {"current_steps": 4075, "total_steps": 4340, "loss": 0.409, "lr": 4.559753545037171e-07, "epoch": 6.57258064516129, "percentage": 93.89, "elapsed_time": "20:05:17", "remaining_time": "1:18:22"}
816
+ {"current_steps": 4080, "total_steps": 4340, "loss": 0.3983, "lr": 4.3905694165067735e-07, "epoch": 6.580645161290323, "percentage": 94.01, "elapsed_time": "20:06:54", "remaining_time": "1:16:54"}
817
+ {"current_steps": 4085, "total_steps": 4340, "loss": 0.407, "lr": 4.2245487635081075e-07, "epoch": 6.588709677419355, "percentage": 94.12, "elapsed_time": "20:08:45", "remaining_time": "1:15:27"}
818
+ {"current_steps": 4090, "total_steps": 4340, "loss": 0.3993, "lr": 4.061694270994965e-07, "epoch": 6.596774193548387, "percentage": 94.24, "elapsed_time": "20:10:18", "remaining_time": "1:13:58"}
819
+ {"current_steps": 4095, "total_steps": 4340, "loss": 0.405, "lr": 3.9020085727166536e-07, "epoch": 6.604838709677419, "percentage": 94.35, "elapsed_time": "20:11:48", "remaining_time": "1:12:30"}
820
+ {"current_steps": 4100, "total_steps": 4340, "loss": 0.4104, "lr": 3.74549425117543e-07, "epoch": 6.612903225806452, "percentage": 94.47, "elapsed_time": "20:13:11", "remaining_time": "1:11:00"}
821
+ {"current_steps": 4105, "total_steps": 4340, "loss": 0.4106, "lr": 3.5921538375847776e-07, "epoch": 6.620967741935484, "percentage": 94.59, "elapsed_time": "20:14:27", "remaining_time": "1:09:31"}
822
+ {"current_steps": 4110, "total_steps": 4340, "loss": 0.4006, "lr": 3.441989811828417e-07, "epoch": 6.629032258064516, "percentage": 94.7, "elapsed_time": "20:15:56", "remaining_time": "1:08:02"}
823
+ {"current_steps": 4115, "total_steps": 4340, "loss": 0.4191, "lr": 3.2950046024202485e-07, "epoch": 6.637096774193548, "percentage": 94.82, "elapsed_time": "20:17:20", "remaining_time": "1:06:33"}
824
+ {"current_steps": 4120, "total_steps": 4340, "loss": 0.3765, "lr": 3.1512005864650973e-07, "epoch": 6.645161290322581, "percentage": 94.93, "elapsed_time": "20:19:07", "remaining_time": "1:05:05"}
825
+ {"current_steps": 4125, "total_steps": 4340, "loss": 0.4007, "lr": 3.010580089620163e-07, "epoch": 6.653225806451613, "percentage": 95.05, "elapsed_time": "20:20:33", "remaining_time": "1:03:37"}
826
+ {"current_steps": 4130, "total_steps": 4340, "loss": 0.4376, "lr": 2.8731453860575185e-07, "epoch": 6.661290322580645, "percentage": 95.16, "elapsed_time": "20:21:54", "remaining_time": "1:02:07"}
827
+ {"current_steps": 4135, "total_steps": 4340, "loss": 0.4097, "lr": 2.738898698427228e-07, "epoch": 6.669354838709677, "percentage": 95.28, "elapsed_time": "20:23:14", "remaining_time": "1:00:38"}
828
+ {"current_steps": 4140, "total_steps": 4340, "loss": 0.4054, "lr": 2.607842197821553e-07, "epoch": 6.67741935483871, "percentage": 95.39, "elapsed_time": "20:24:39", "remaining_time": "0:59:09"}
829
+ {"current_steps": 4145, "total_steps": 4340, "loss": 0.3984, "lr": 2.479978003739669e-07, "epoch": 6.685483870967742, "percentage": 95.51, "elapsed_time": "20:26:14", "remaining_time": "0:57:41"}
830
+ {"current_steps": 4150, "total_steps": 4340, "loss": 0.3899, "lr": 2.3553081840535396e-07, "epoch": 6.693548387096774, "percentage": 95.62, "elapsed_time": "20:27:41", "remaining_time": "0:56:12"}
831
+ {"current_steps": 4155, "total_steps": 4340, "loss": 0.4066, "lr": 2.2338347549742956e-07, "epoch": 6.701612903225806, "percentage": 95.74, "elapsed_time": "20:29:05", "remaining_time": "0:54:43"}
832
+ {"current_steps": 4160, "total_steps": 4340, "loss": 0.401, "lr": 2.115559681019863e-07, "epoch": 6.709677419354839, "percentage": 95.85, "elapsed_time": "20:30:34", "remaining_time": "0:53:14"}
833
+ {"current_steps": 4165, "total_steps": 4340, "loss": 0.4014, "lr": 2.0004848749829663e-07, "epoch": 6.717741935483871, "percentage": 95.97, "elapsed_time": "20:31:51", "remaining_time": "0:51:45"}
834
+ {"current_steps": 4170, "total_steps": 4340, "loss": 0.3828, "lr": 1.8886121979003302e-07, "epoch": 6.725806451612903, "percentage": 96.08, "elapsed_time": "20:33:12", "remaining_time": "0:50:16"}
835
+ {"current_steps": 4175, "total_steps": 4340, "loss": 0.4244, "lr": 1.7799434590225484e-07, "epoch": 6.733870967741936, "percentage": 96.2, "elapsed_time": "20:35:02", "remaining_time": "0:48:48"}
836
+ {"current_steps": 4180, "total_steps": 4340, "loss": 0.4074, "lr": 1.6744804157848183e-07, "epoch": 6.741935483870968, "percentage": 96.31, "elapsed_time": "20:36:27", "remaining_time": "0:47:19"}
837
+ {"current_steps": 4185, "total_steps": 4340, "loss": 0.4039, "lr": 1.5722247737784968e-07, "epoch": 6.75, "percentage": 96.43, "elapsed_time": "20:38:02", "remaining_time": "0:45:51"}
838
+ {"current_steps": 4190, "total_steps": 4340, "loss": 0.4022, "lr": 1.473178186723545e-07, "epoch": 6.758064516129032, "percentage": 96.54, "elapsed_time": "20:39:28", "remaining_time": "0:44:22"}
839
+ {"current_steps": 4195, "total_steps": 4340, "loss": 0.4031, "lr": 1.3773422564417939e-07, "epoch": 6.766129032258064, "percentage": 96.66, "elapsed_time": "20:40:52", "remaining_time": "0:42:53"}
840
+ {"current_steps": 4200, "total_steps": 4340, "loss": 0.3839, "lr": 1.2847185328310087e-07, "epoch": 6.774193548387097, "percentage": 96.77, "elapsed_time": "20:42:10", "remaining_time": "0:41:24"}