penfever commited on
Commit
1453de1
·
verified ·
1 Parent(s): a6edd1c

Training in progress, step 5200

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f295043e862bfc43941b52818ed957acadb915a5b77b1f242b5b9cfba576a963
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03ef76a6ba267115adecbd717ed5b6c3d1a42e94d2558a3d9596b02f28e38b3c
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f198a7013444abd027674a0fa3316dd45bdecc853249dd43fd90f7126232dd9c
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f2fc4496cfe38a75c60ffb6da8f9225b1f65b83fd22a1a181fbfdd4c2907ab4
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ef60c579a98ae7b1c2a662ae65d7b064e89ae41226043766fdf4ff225913da88
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:476c07cfbbd73d3f8ffdde332a82f1934f1c8a631e8544a01626c42b66f65380
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:044d403b950c44e6a0e078ffb7217b9a6db825ce1cd485d56c9040b4ad533f93
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d335eb82c918d4e2523a9aa3f1a0cb3410ecc07e5e425bb972b26bc765ba0f5
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -1001,3 +1001,44 @@
1001
  {"current_steps": 4995, "total_steps": 6188, "loss": 0.0625, "lr": 4.367893544535757e-06, "epoch": 5.65195246179966, "percentage": 80.72, "elapsed_time": "14:52:40", "remaining_time": "3:33:12"}
1002
  {"current_steps": 5000, "total_steps": 6188, "loss": 0.0615, "lr": 4.332767381597575e-06, "epoch": 5.657611771363894, "percentage": 80.8, "elapsed_time": "14:54:11", "remaining_time": "3:32:27"}
1003
  {"current_steps": 5005, "total_steps": 6188, "loss": 0.0647, "lr": 4.297765864365453e-06, "epoch": 5.663271080928126, "percentage": 80.88, "elapsed_time": "14:57:02", "remaining_time": "3:32:01"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1001
  {"current_steps": 4995, "total_steps": 6188, "loss": 0.0625, "lr": 4.367893544535757e-06, "epoch": 5.65195246179966, "percentage": 80.72, "elapsed_time": "14:52:40", "remaining_time": "3:33:12"}
1002
  {"current_steps": 5000, "total_steps": 6188, "loss": 0.0615, "lr": 4.332767381597575e-06, "epoch": 5.657611771363894, "percentage": 80.8, "elapsed_time": "14:54:11", "remaining_time": "3:32:27"}
1003
  {"current_steps": 5005, "total_steps": 6188, "loss": 0.0647, "lr": 4.297765864365453e-06, "epoch": 5.663271080928126, "percentage": 80.88, "elapsed_time": "14:57:02", "remaining_time": "3:32:01"}
1004
+ {"current_steps": 5010, "total_steps": 6188, "loss": 0.1096, "lr": 4.262889271305204e-06, "epoch": 5.66893039049236, "percentage": 80.96, "elapsed_time": "14:59:18", "remaining_time": "3:31:27"}
1005
+ {"current_steps": 5015, "total_steps": 6188, "loss": 0.0926, "lr": 4.228137879888774e-06, "epoch": 5.674589700056593, "percentage": 81.04, "elapsed_time": "15:01:07", "remaining_time": "3:30:46"}
1006
+ {"current_steps": 5020, "total_steps": 6188, "loss": 0.0755, "lr": 4.193511966592041e-06, "epoch": 5.680249009620827, "percentage": 81.12, "elapsed_time": "15:02:40", "remaining_time": "3:30:01"}
1007
+ {"current_steps": 5025, "total_steps": 6188, "loss": 0.0911, "lr": 4.1590118068925815e-06, "epoch": 5.685908319185059, "percentage": 81.21, "elapsed_time": "15:04:22", "remaining_time": "3:29:18"}
1008
+ {"current_steps": 5030, "total_steps": 6188, "loss": 0.1086, "lr": 4.124637675267511e-06, "epoch": 5.691567628749293, "percentage": 81.29, "elapsed_time": "15:06:13", "remaining_time": "3:28:37"}
1009
+ {"current_steps": 5035, "total_steps": 6188, "loss": 0.0774, "lr": 4.090389845191278e-06, "epoch": 5.697226938313526, "percentage": 81.37, "elapsed_time": "15:07:47", "remaining_time": "3:27:52"}
1010
+ {"current_steps": 5040, "total_steps": 6188, "loss": 0.095, "lr": 4.056268589133516e-06, "epoch": 5.702886247877759, "percentage": 81.45, "elapsed_time": "15:09:23", "remaining_time": "3:27:08"}
1011
+ {"current_steps": 5045, "total_steps": 6188, "loss": 0.0772, "lr": 4.022274178556844e-06, "epoch": 5.708545557441992, "percentage": 81.53, "elapsed_time": "15:10:59", "remaining_time": "3:26:23"}
1012
+ {"current_steps": 5050, "total_steps": 6188, "loss": 0.0696, "lr": 3.988406883914717e-06, "epoch": 5.7142048670062255, "percentage": 81.61, "elapsed_time": "15:12:47", "remaining_time": "3:25:41"}
1013
+ {"current_steps": 5055, "total_steps": 6188, "loss": 0.076, "lr": 3.954666974649295e-06, "epoch": 5.719864176570458, "percentage": 81.69, "elapsed_time": "15:14:49", "remaining_time": "3:25:02"}
1014
+ {"current_steps": 5060, "total_steps": 6188, "loss": 0.0679, "lr": 3.921054719189272e-06, "epoch": 5.7255234861346915, "percentage": 81.77, "elapsed_time": "15:16:48", "remaining_time": "3:24:22"}
1015
+ {"current_steps": 5065, "total_steps": 6188, "loss": 0.0657, "lr": 3.887570384947745e-06, "epoch": 5.731182795698925, "percentage": 81.85, "elapsed_time": "15:18:27", "remaining_time": "3:23:38"}
1016
+ {"current_steps": 5070, "total_steps": 6188, "loss": 0.0783, "lr": 3.854214238320109e-06, "epoch": 5.7368421052631575, "percentage": 81.93, "elapsed_time": "15:20:21", "remaining_time": "3:22:57"}
1017
+ {"current_steps": 5075, "total_steps": 6188, "loss": 0.0818, "lr": 3.8209865446819105e-06, "epoch": 5.742501414827391, "percentage": 82.01, "elapsed_time": "15:22:20", "remaining_time": "3:22:16"}
1018
+ {"current_steps": 5080, "total_steps": 6188, "loss": 0.0845, "lr": 3.7878875683867476e-06, "epoch": 5.748160724391624, "percentage": 82.09, "elapsed_time": "15:23:55", "remaining_time": "3:21:30"}
1019
+ {"current_steps": 5085, "total_steps": 6188, "loss": 0.0697, "lr": 3.7549175727641606e-06, "epoch": 5.753820033955858, "percentage": 82.18, "elapsed_time": "15:25:34", "remaining_time": "3:20:46"}
1020
+ {"current_steps": 5090, "total_steps": 6188, "loss": 0.0718, "lr": 3.7220768201175615e-06, "epoch": 5.75947934352009, "percentage": 82.26, "elapsed_time": "15:27:13", "remaining_time": "3:20:01"}
1021
+ {"current_steps": 5095, "total_steps": 6188, "loss": 0.0798, "lr": 3.689365571722112e-06, "epoch": 5.765138653084324, "percentage": 82.34, "elapsed_time": "15:29:00", "remaining_time": "3:19:17"}
1022
+ {"current_steps": 5100, "total_steps": 6188, "loss": 0.0592, "lr": 3.6567840878226577e-06, "epoch": 5.770797962648556, "percentage": 82.42, "elapsed_time": "15:30:34", "remaining_time": "3:18:31"}
1023
+ {"current_steps": 5105, "total_steps": 6188, "loss": 0.0763, "lr": 3.624332627631679e-06, "epoch": 5.77645727221279, "percentage": 82.5, "elapsed_time": "15:32:08", "remaining_time": "3:17:44"}
1024
+ {"current_steps": 5110, "total_steps": 6188, "loss": 0.0745, "lr": 3.5920114493271974e-06, "epoch": 5.782116581777023, "percentage": 82.58, "elapsed_time": "15:33:47", "remaining_time": "3:16:59"}
1025
+ {"current_steps": 5115, "total_steps": 6188, "loss": 0.0847, "lr": 3.5598208100507314e-06, "epoch": 5.787775891341257, "percentage": 82.66, "elapsed_time": "15:35:33", "remaining_time": "3:16:15"}
1026
+ {"current_steps": 5120, "total_steps": 6188, "loss": 0.0754, "lr": 3.5277609659052712e-06, "epoch": 5.793435200905489, "percentage": 82.74, "elapsed_time": "15:37:16", "remaining_time": "3:15:30"}
1027
+ {"current_steps": 5125, "total_steps": 6188, "loss": 0.0807, "lr": 3.4958321719532106e-06, "epoch": 5.799094510469723, "percentage": 82.82, "elapsed_time": "15:38:45", "remaining_time": "3:14:42"}
1028
+ {"current_steps": 5130, "total_steps": 6188, "loss": 0.0763, "lr": 3.4640346822143324e-06, "epoch": 5.804753820033956, "percentage": 82.9, "elapsed_time": "15:40:34", "remaining_time": "3:13:58"}
1029
+ {"current_steps": 5135, "total_steps": 6188, "loss": 0.0834, "lr": 3.4323687496637837e-06, "epoch": 5.810413129598189, "percentage": 82.98, "elapsed_time": "15:42:18", "remaining_time": "3:13:13"}
1030
+ {"current_steps": 5140, "total_steps": 6188, "loss": 0.0748, "lr": 3.4008346262300852e-06, "epoch": 5.816072439162422, "percentage": 83.06, "elapsed_time": "15:43:55", "remaining_time": "3:12:27"}
1031
+ {"current_steps": 5145, "total_steps": 6188, "loss": 0.0674, "lr": 3.3694325627930846e-06, "epoch": 5.8217317487266556, "percentage": 83.14, "elapsed_time": "15:45:23", "remaining_time": "3:11:38"}
1032
+ {"current_steps": 5150, "total_steps": 6188, "loss": 0.0877, "lr": 3.3381628091819907e-06, "epoch": 5.827391058290889, "percentage": 83.23, "elapsed_time": "15:47:22", "remaining_time": "3:10:56"}
1033
+ {"current_steps": 5155, "total_steps": 6188, "loss": 0.0668, "lr": 3.3070256141733913e-06, "epoch": 5.8330503678551215, "percentage": 83.31, "elapsed_time": "15:49:00", "remaining_time": "3:10:10"}
1034
+ {"current_steps": 5160, "total_steps": 6188, "loss": 0.0663, "lr": 3.2760212254892453e-06, "epoch": 5.838709677419355, "percentage": 83.39, "elapsed_time": "15:50:48", "remaining_time": "3:09:25"}
1035
+ {"current_steps": 5165, "total_steps": 6188, "loss": 0.0755, "lr": 3.245149889794932e-06, "epoch": 5.8443689869835875, "percentage": 83.47, "elapsed_time": "15:52:38", "remaining_time": "3:08:41"}
1036
+ {"current_steps": 5170, "total_steps": 6188, "loss": 0.0609, "lr": 3.2144118526972943e-06, "epoch": 5.850028296547821, "percentage": 83.55, "elapsed_time": "15:54:18", "remaining_time": "3:07:54"}
1037
+ {"current_steps": 5175, "total_steps": 6188, "loss": 0.0612, "lr": 3.1838073587426676e-06, "epoch": 5.855687606112054, "percentage": 83.63, "elapsed_time": "15:55:54", "remaining_time": "3:07:06"}
1038
+ {"current_steps": 5180, "total_steps": 6188, "loss": 0.079, "lr": 3.153336651414933e-06, "epoch": 5.861346915676288, "percentage": 83.71, "elapsed_time": "15:57:34", "remaining_time": "3:06:20"}
1039
+ {"current_steps": 5185, "total_steps": 6188, "loss": 0.0941, "lr": 3.1229999731336137e-06, "epoch": 5.86700622524052, "percentage": 83.79, "elapsed_time": "15:59:25", "remaining_time": "3:05:35"}
1040
+ {"current_steps": 5190, "total_steps": 6188, "loss": 0.0713, "lr": 3.0927975652518994e-06, "epoch": 5.872665534804754, "percentage": 83.87, "elapsed_time": "16:01:00", "remaining_time": "3:04:47"}
1041
+ {"current_steps": 5195, "total_steps": 6188, "loss": 0.0797, "lr": 3.062729668054756e-06, "epoch": 5.878324844368987, "percentage": 83.95, "elapsed_time": "16:02:37", "remaining_time": "3:04:00"}
1042
+ {"current_steps": 5200, "total_steps": 6188, "loss": 0.0904, "lr": 3.032796520757002e-06, "epoch": 5.88398415393322, "percentage": 84.03, "elapsed_time": "16:04:12", "remaining_time": "3:03:11"}
1043
+ {"current_steps": 5205, "total_steps": 6188, "loss": 0.0683, "lr": 3.0029983615014234e-06, "epoch": 5.889643463497453, "percentage": 84.11, "elapsed_time": "16:06:55", "remaining_time": "3:02:36"}
1044
+ {"current_steps": 5210, "total_steps": 6188, "loss": 0.0739, "lr": 2.9733354273568514e-06, "epoch": 5.895302773061687, "percentage": 84.2, "elapsed_time": "16:08:29", "remaining_time": "3:01:48"}