penfever commited on
Commit
5829717
·
verified ·
1 Parent(s): 7cdb8d4

Training in progress, step 4600

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f5e23115707566cc6e06829d64d21eae00a89a1c471f9e734393096561787aa5
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:efc0f1af468e1e5430a1a05c06b56a8498196657df5df1f5aa9aa5818216c4da
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:951457c8682581414683c4b8e11bc1d81ffab7ac282fec1aa3e9333b6f44e4a7
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fca68e979031a70a450a45dc7e17dd715de4fec85975faf382f0b38820b15e3f
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94ad528bc4f035a06e01b84098f1f34da3d31ecbc0f178635f35a7ba40fcc77c
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d1713105c09718a5a1ccd1be23f6c6577e057e3473eb770ff3a696d0fb957b8
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e14786f7e81d4d7347dbb5e29a4e7333f1ea4df5a88ba9f97c4d35df7e3ba3ef
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:843ce9e0a160085bb2404786a6d4e815027b301170402fab469afb1c68ab479b
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -878,3 +878,43 @@
878
  {"current_steps": 4390, "total_steps": 6713, "loss": 0.18, "lr": 1.2913139082569434e-05, "epoch": 4.579029733959311, "percentage": 65.4, "elapsed_time": "16:30:53", "remaining_time": "8:44:20"}
879
  {"current_steps": 4395, "total_steps": 6713, "loss": 0.1906, "lr": 1.2864532868358799e-05, "epoch": 4.584246218049035, "percentage": 65.47, "elapsed_time": "16:33:36", "remaining_time": "8:44:02"}
880
  {"current_steps": 4400, "total_steps": 6713, "loss": 0.1788, "lr": 1.2815974898252482e-05, "epoch": 4.589462702138759, "percentage": 65.54, "elapsed_time": "16:36:22", "remaining_time": "8:43:46"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
878
  {"current_steps": 4390, "total_steps": 6713, "loss": 0.18, "lr": 1.2913139082569434e-05, "epoch": 4.579029733959311, "percentage": 65.4, "elapsed_time": "16:30:53", "remaining_time": "8:44:20"}
879
  {"current_steps": 4395, "total_steps": 6713, "loss": 0.1906, "lr": 1.2864532868358799e-05, "epoch": 4.584246218049035, "percentage": 65.47, "elapsed_time": "16:33:36", "remaining_time": "8:44:02"}
880
  {"current_steps": 4400, "total_steps": 6713, "loss": 0.1788, "lr": 1.2815974898252482e-05, "epoch": 4.589462702138759, "percentage": 65.54, "elapsed_time": "16:36:22", "remaining_time": "8:43:46"}
881
+ {"current_steps": 4405, "total_steps": 6713, "loss": 0.1903, "lr": 1.2767465500559162e-05, "epoch": 4.594679186228482, "percentage": 65.62, "elapsed_time": "16:40:11", "remaining_time": "8:44:02"}
882
+ {"current_steps": 4410, "total_steps": 6713, "loss": 0.1777, "lr": 1.271900500325911e-05, "epoch": 4.5998956703182055, "percentage": 65.69, "elapsed_time": "16:42:51", "remaining_time": "8:43:42"}
883
+ {"current_steps": 4415, "total_steps": 6713, "loss": 0.1865, "lr": 1.2670593734001972e-05, "epoch": 4.605112154407929, "percentage": 65.77, "elapsed_time": "16:45:21", "remaining_time": "8:43:17"}
884
+ {"current_steps": 4420, "total_steps": 6713, "loss": 0.1878, "lr": 1.2622232020104568e-05, "epoch": 4.610328638497653, "percentage": 65.84, "elapsed_time": "16:48:14", "remaining_time": "8:43:03"}
885
+ {"current_steps": 4425, "total_steps": 6713, "loss": 0.1886, "lr": 1.2573920188548634e-05, "epoch": 4.615545122587376, "percentage": 65.92, "elapsed_time": "16:50:59", "remaining_time": "8:42:44"}
886
+ {"current_steps": 4430, "total_steps": 6713, "loss": 0.1993, "lr": 1.2525658565978668e-05, "epoch": 4.6207616066771, "percentage": 65.99, "elapsed_time": "16:53:37", "remaining_time": "8:42:22"}
887
+ {"current_steps": 4435, "total_steps": 6713, "loss": 0.1868, "lr": 1.2477447478699696e-05, "epoch": 4.625978090766823, "percentage": 66.07, "elapsed_time": "16:56:24", "remaining_time": "8:42:03"}
888
+ {"current_steps": 4440, "total_steps": 6713, "loss": 0.1959, "lr": 1.2429287252675062e-05, "epoch": 4.631194574856547, "percentage": 66.14, "elapsed_time": "16:58:59", "remaining_time": "8:41:39"}
889
+ {"current_steps": 4445, "total_steps": 6713, "loss": 0.1864, "lr": 1.2381178213524223e-05, "epoch": 4.63641105894627, "percentage": 66.21, "elapsed_time": "17:01:35", "remaining_time": "8:41:15"}
890
+ {"current_steps": 4450, "total_steps": 6713, "loss": 0.1772, "lr": 1.2333120686520568e-05, "epoch": 4.641627543035994, "percentage": 66.29, "elapsed_time": "17:04:18", "remaining_time": "8:40:54"}
891
+ {"current_steps": 4455, "total_steps": 6713, "loss": 0.1791, "lr": 1.2285114996589181e-05, "epoch": 4.646844027125717, "percentage": 66.36, "elapsed_time": "17:07:06", "remaining_time": "8:40:35"}
892
+ {"current_steps": 4460, "total_steps": 6713, "loss": 0.1924, "lr": 1.2237161468304681e-05, "epoch": 4.652060511215441, "percentage": 66.44, "elapsed_time": "17:09:45", "remaining_time": "8:40:11"}
893
+ {"current_steps": 4465, "total_steps": 6713, "loss": 0.1851, "lr": 1.218926042588902e-05, "epoch": 4.657276995305164, "percentage": 66.51, "elapsed_time": "17:12:41", "remaining_time": "8:39:55"}
894
+ {"current_steps": 4470, "total_steps": 6713, "loss": 0.1882, "lr": 1.2141412193209274e-05, "epoch": 4.662493479394888, "percentage": 66.59, "elapsed_time": "17:15:18", "remaining_time": "8:39:30"}
895
+ {"current_steps": 4475, "total_steps": 6713, "loss": 0.1959, "lr": 1.2093617093775458e-05, "epoch": 4.6677099634846115, "percentage": 66.66, "elapsed_time": "17:18:09", "remaining_time": "8:39:11"}
896
+ {"current_steps": 4480, "total_steps": 6713, "loss": 0.1928, "lr": 1.2045875450738352e-05, "epoch": 4.672926447574335, "percentage": 66.74, "elapsed_time": "17:20:48", "remaining_time": "8:38:46"}
897
+ {"current_steps": 4485, "total_steps": 6713, "loss": 0.1834, "lr": 1.199818758688731e-05, "epoch": 4.678142931664058, "percentage": 66.81, "elapsed_time": "17:23:36", "remaining_time": "8:38:25"}
898
+ {"current_steps": 4490, "total_steps": 6713, "loss": 0.1946, "lr": 1.1950553824648077e-05, "epoch": 4.683359415753782, "percentage": 66.89, "elapsed_time": "17:26:17", "remaining_time": "8:38:01"}
899
+ {"current_steps": 4495, "total_steps": 6713, "loss": 0.1814, "lr": 1.1902974486080599e-05, "epoch": 4.688575899843506, "percentage": 66.96, "elapsed_time": "17:29:09", "remaining_time": "8:37:41"}
900
+ {"current_steps": 4500, "total_steps": 6713, "loss": 0.1953, "lr": 1.1855449892876858e-05, "epoch": 4.6937923839332285, "percentage": 67.03, "elapsed_time": "17:31:46", "remaining_time": "8:37:14"}
901
+ {"current_steps": 4505, "total_steps": 6713, "loss": 0.1795, "lr": 1.1807980366358699e-05, "epoch": 4.699008868022952, "percentage": 67.11, "elapsed_time": "17:34:37", "remaining_time": "8:36:53"}
902
+ {"current_steps": 4510, "total_steps": 6713, "loss": 0.1986, "lr": 1.1760566227475642e-05, "epoch": 4.704225352112676, "percentage": 67.18, "elapsed_time": "17:37:15", "remaining_time": "8:36:26"}
903
+ {"current_steps": 4515, "total_steps": 6713, "loss": 0.1848, "lr": 1.1713207796802739e-05, "epoch": 4.7094418362024, "percentage": 67.26, "elapsed_time": "17:39:47", "remaining_time": "8:35:55"}
904
+ {"current_steps": 4520, "total_steps": 6713, "loss": 0.2054, "lr": 1.166590539453837e-05, "epoch": 4.7146583202921235, "percentage": 67.33, "elapsed_time": "17:42:25", "remaining_time": "8:35:27"}
905
+ {"current_steps": 4525, "total_steps": 6713, "loss": 0.1785, "lr": 1.1618659340502104e-05, "epoch": 4.719874804381846, "percentage": 67.41, "elapsed_time": "17:45:11", "remaining_time": "8:35:03"}
906
+ {"current_steps": 4530, "total_steps": 6713, "loss": 0.1882, "lr": 1.157146995413252e-05, "epoch": 4.72509128847157, "percentage": 67.48, "elapsed_time": "17:47:58", "remaining_time": "8:34:39"}
907
+ {"current_steps": 4535, "total_steps": 6713, "loss": 0.1959, "lr": 1.152433755448509e-05, "epoch": 4.730307772561294, "percentage": 67.56, "elapsed_time": "17:50:44", "remaining_time": "8:34:14"}
908
+ {"current_steps": 4540, "total_steps": 6713, "loss": 0.1896, "lr": 1.1477262460229945e-05, "epoch": 4.735524256651017, "percentage": 67.63, "elapsed_time": "17:53:31", "remaining_time": "8:33:49"}
909
+ {"current_steps": 4545, "total_steps": 6713, "loss": 0.1874, "lr": 1.143024498964981e-05, "epoch": 4.7407407407407405, "percentage": 67.7, "elapsed_time": "17:56:14", "remaining_time": "8:33:22"}
910
+ {"current_steps": 4550, "total_steps": 6713, "loss": 0.1924, "lr": 1.1383285460637766e-05, "epoch": 4.745957224830464, "percentage": 67.78, "elapsed_time": "17:58:45", "remaining_time": "8:32:49"}
911
+ {"current_steps": 4555, "total_steps": 6713, "loss": 0.1889, "lr": 1.1336384190695172e-05, "epoch": 4.751173708920188, "percentage": 67.85, "elapsed_time": "18:01:35", "remaining_time": "8:32:25"}
912
+ {"current_steps": 4560, "total_steps": 6713, "loss": 0.1934, "lr": 1.1289541496929466e-05, "epoch": 4.756390193009912, "percentage": 67.93, "elapsed_time": "18:04:27", "remaining_time": "8:32:01"}
913
+ {"current_steps": 4565, "total_steps": 6713, "loss": 0.1924, "lr": 1.1242757696052044e-05, "epoch": 4.761606677099635, "percentage": 68.0, "elapsed_time": "18:06:59", "remaining_time": "8:31:28"}
914
+ {"current_steps": 4570, "total_steps": 6713, "loss": 0.1793, "lr": 1.1196033104376141e-05, "epoch": 4.766823161189358, "percentage": 68.08, "elapsed_time": "18:09:46", "remaining_time": "8:31:01"}
915
+ {"current_steps": 4575, "total_steps": 6713, "loss": 0.1924, "lr": 1.1149368037814644e-05, "epoch": 4.772039645279082, "percentage": 68.15, "elapsed_time": "18:12:31", "remaining_time": "8:30:33"}
916
+ {"current_steps": 4580, "total_steps": 6713, "loss": 0.1798, "lr": 1.1102762811877974e-05, "epoch": 4.777256129368805, "percentage": 68.23, "elapsed_time": "18:15:13", "remaining_time": "8:30:04"}
917
+ {"current_steps": 4585, "total_steps": 6713, "loss": 0.1835, "lr": 1.1056217741672e-05, "epoch": 4.782472613458529, "percentage": 68.3, "elapsed_time": "18:18:04", "remaining_time": "8:29:38"}
918
+ {"current_steps": 4590, "total_steps": 6713, "loss": 0.205, "lr": 1.1009733141895823e-05, "epoch": 4.7876890975482524, "percentage": 68.37, "elapsed_time": "18:20:48", "remaining_time": "8:29:09"}
919
+ {"current_steps": 4595, "total_steps": 6713, "loss": 0.1921, "lr": 1.0963309326839708e-05, "epoch": 4.792905581637976, "percentage": 68.45, "elapsed_time": "18:23:39", "remaining_time": "8:28:42"}
920
+ {"current_steps": 4600, "total_steps": 6713, "loss": 0.1859, "lr": 1.0916946610382966e-05, "epoch": 4.7981220657277, "percentage": 68.52, "elapsed_time": "18:26:27", "remaining_time": "8:28:15"}