penfever commited on
Commit
9d7b56e
·
verified ·
1 Parent(s): b1e02a2

Training in progress, step 4200

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:815ecdc95f7a5beb413d8c14b8d3a754263e3ee116d3edd0ef78f2d90364dc39
3
  size 4902257696
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:174e880aecaaa9b374eb3cca3e9c9120e191774903a149f74ae874cecdffebe8
3
  size 4902257696
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ca495972ac8e16ee0b46c12742c2f851b126d5063faa7498991de37fe2a222d2
3
  size 4915960368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:030a4a35407284dfecaf4d479706f5b0e015e4d04f83d168fb458778f6580fed
3
  size 4915960368
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bed0b890c99c700853d0309386871dfe61798252ff9aa38db0b9b25f92ffdff6
3
  size 4983068496
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b45d563800af7092cef613f419f50191cdc9eddb61dc0f68f1cf8433fe5a3fc8
3
  size 4983068496
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f534755dcea0e087973e8d0f3fe1d00446667426886019296460277ad48658c
3
  size 1580230264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d7b9350185fb70ac529ec8784625ee8ced48b6d22f4e0757e86665a054bdf2e
3
  size 1580230264
trainer_log.jsonl CHANGED
@@ -803,3 +803,43 @@
803
  {"current_steps": 3990, "total_steps": 6188, "loss": 0.0752, "lr": 1.3513593246732506e-05, "epoch": 4.514997170345218, "percentage": 64.48, "elapsed_time": "6:02:59", "remaining_time": "3:19:58"}
804
  {"current_steps": 3995, "total_steps": 6188, "loss": 0.0915, "lr": 1.3460256197794768e-05, "epoch": 4.5206564799094515, "percentage": 64.56, "elapsed_time": "6:04:32", "remaining_time": "3:20:06"}
805
  {"current_steps": 4000, "total_steps": 6188, "loss": 0.0746, "lr": 1.3406971177891343e-05, "epoch": 4.526315789473684, "percentage": 64.64, "elapsed_time": "6:06:07", "remaining_time": "3:20:16"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
803
  {"current_steps": 3990, "total_steps": 6188, "loss": 0.0752, "lr": 1.3513593246732506e-05, "epoch": 4.514997170345218, "percentage": 64.48, "elapsed_time": "6:02:59", "remaining_time": "3:19:58"}
804
  {"current_steps": 3995, "total_steps": 6188, "loss": 0.0915, "lr": 1.3460256197794768e-05, "epoch": 4.5206564799094515, "percentage": 64.56, "elapsed_time": "6:04:32", "remaining_time": "3:20:06"}
805
  {"current_steps": 4000, "total_steps": 6188, "loss": 0.0746, "lr": 1.3406971177891343e-05, "epoch": 4.526315789473684, "percentage": 64.64, "elapsed_time": "6:06:07", "remaining_time": "3:20:16"}
806
+ {"current_steps": 4005, "total_steps": 6188, "loss": 0.0755, "lr": 1.3353738610948347e-05, "epoch": 4.5319750990379175, "percentage": 64.72, "elapsed_time": "6:08:56", "remaining_time": "3:21:06"}
807
+ {"current_steps": 4010, "total_steps": 6188, "loss": 0.089, "lr": 1.3300558920474586e-05, "epoch": 4.53763440860215, "percentage": 64.8, "elapsed_time": "6:10:31", "remaining_time": "3:21:14"}
808
+ {"current_steps": 4015, "total_steps": 6188, "loss": 0.0696, "lr": 1.3247432529558175e-05, "epoch": 4.5432937181663835, "percentage": 64.88, "elapsed_time": "6:12:34", "remaining_time": "3:21:38"}
809
+ {"current_steps": 4020, "total_steps": 6188, "loss": 0.0764, "lr": 1.3194359860863201e-05, "epoch": 4.548953027730617, "percentage": 64.96, "elapsed_time": "6:14:20", "remaining_time": "3:21:52"}
810
+ {"current_steps": 4025, "total_steps": 6188, "loss": 0.0741, "lr": 1.3141341336626336e-05, "epoch": 4.55461233729485, "percentage": 65.05, "elapsed_time": "6:16:11", "remaining_time": "3:22:09"}
811
+ {"current_steps": 4030, "total_steps": 6188, "loss": 0.1747, "lr": 1.3088377378653503e-05, "epoch": 4.560271646859083, "percentage": 65.13, "elapsed_time": "6:19:08", "remaining_time": "3:23:01"}
812
+ {"current_steps": 4035, "total_steps": 6188, "loss": 0.0731, "lr": 1.3035468408316501e-05, "epoch": 4.565930956423316, "percentage": 65.21, "elapsed_time": "6:20:43", "remaining_time": "3:23:08"}
813
+ {"current_steps": 4040, "total_steps": 6188, "loss": 0.0842, "lr": 1.2982614846549639e-05, "epoch": 4.57159026598755, "percentage": 65.29, "elapsed_time": "6:22:33", "remaining_time": "3:23:24"}
814
+ {"current_steps": 4045, "total_steps": 6188, "loss": 0.1049, "lr": 1.2929817113846428e-05, "epoch": 4.577249575551782, "percentage": 65.37, "elapsed_time": "6:24:29", "remaining_time": "3:23:41"}
815
+ {"current_steps": 4050, "total_steps": 6188, "loss": 0.1585, "lr": 1.287707563025621e-05, "epoch": 4.582908885116016, "percentage": 65.45, "elapsed_time": "6:27:21", "remaining_time": "3:24:29"}
816
+ {"current_steps": 4055, "total_steps": 6188, "loss": 0.158, "lr": 1.2824390815380805e-05, "epoch": 4.588568194680249, "percentage": 65.53, "elapsed_time": "6:30:17", "remaining_time": "3:25:18"}
817
+ {"current_steps": 4060, "total_steps": 6188, "loss": 0.1529, "lr": 1.2771763088371202e-05, "epoch": 4.594227504244482, "percentage": 65.61, "elapsed_time": "6:33:16", "remaining_time": "3:26:07"}
818
+ {"current_steps": 4065, "total_steps": 6188, "loss": 0.1535, "lr": 1.2719192867924197e-05, "epoch": 4.599886813808715, "percentage": 65.69, "elapsed_time": "6:36:12", "remaining_time": "3:26:55"}
819
+ {"current_steps": 4070, "total_steps": 6188, "loss": 0.1609, "lr": 1.2666680572279083e-05, "epoch": 4.605546123372949, "percentage": 65.77, "elapsed_time": "6:39:09", "remaining_time": "3:27:42"}
820
+ {"current_steps": 4075, "total_steps": 6188, "loss": 0.1595, "lr": 1.2614226619214317e-05, "epoch": 4.611205432937181, "percentage": 65.85, "elapsed_time": "6:42:14", "remaining_time": "3:28:34"}
821
+ {"current_steps": 4080, "total_steps": 6188, "loss": 0.1579, "lr": 1.2561831426044173e-05, "epoch": 4.616864742501415, "percentage": 65.93, "elapsed_time": "6:45:11", "remaining_time": "3:29:21"}
822
+ {"current_steps": 4085, "total_steps": 6188, "loss": 0.1579, "lr": 1.250949540961547e-05, "epoch": 4.622524052065648, "percentage": 66.01, "elapsed_time": "6:48:11", "remaining_time": "3:30:08"}
823
+ {"current_steps": 4090, "total_steps": 6188, "loss": 0.164, "lr": 1.2457218986304196e-05, "epoch": 4.6281833616298815, "percentage": 66.1, "elapsed_time": "6:51:01", "remaining_time": "3:30:50"}
824
+ {"current_steps": 4095, "total_steps": 6188, "loss": 0.1508, "lr": 1.2405002572012252e-05, "epoch": 4.633842671194114, "percentage": 66.18, "elapsed_time": "6:54:02", "remaining_time": "3:31:37"}
825
+ {"current_steps": 4100, "total_steps": 6188, "loss": 0.1613, "lr": 1.2352846582164117e-05, "epoch": 4.6395019807583475, "percentage": 66.26, "elapsed_time": "6:56:53", "remaining_time": "3:32:18"}
826
+ {"current_steps": 4105, "total_steps": 6188, "loss": 0.1477, "lr": 1.2300751431703523e-05, "epoch": 4.645161290322581, "percentage": 66.34, "elapsed_time": "6:59:39", "remaining_time": "3:32:56"}
827
+ {"current_steps": 4110, "total_steps": 6188, "loss": 0.1564, "lr": 1.2248717535090196e-05, "epoch": 4.6508205998868135, "percentage": 66.42, "elapsed_time": "7:02:44", "remaining_time": "3:33:44"}
828
+ {"current_steps": 4115, "total_steps": 6188, "loss": 0.1397, "lr": 1.2196745306296522e-05, "epoch": 4.656479909451047, "percentage": 66.5, "elapsed_time": "7:05:40", "remaining_time": "3:34:26"}
829
+ {"current_steps": 4120, "total_steps": 6188, "loss": 0.1421, "lr": 1.2144835158804282e-05, "epoch": 4.66213921901528, "percentage": 66.58, "elapsed_time": "7:08:22", "remaining_time": "3:35:01"}
830
+ {"current_steps": 4125, "total_steps": 6188, "loss": 0.157, "lr": 1.2092987505601346e-05, "epoch": 4.667798528579513, "percentage": 66.66, "elapsed_time": "7:11:19", "remaining_time": "3:35:42"}
831
+ {"current_steps": 4130, "total_steps": 6188, "loss": 0.1517, "lr": 1.2041202759178381e-05, "epoch": 4.673457838143746, "percentage": 66.74, "elapsed_time": "7:14:09", "remaining_time": "3:36:20"}
832
+ {"current_steps": 4135, "total_steps": 6188, "loss": 0.1384, "lr": 1.198948133152559e-05, "epoch": 4.67911714770798, "percentage": 66.82, "elapsed_time": "7:17:14", "remaining_time": "3:37:05"}
833
+ {"current_steps": 4140, "total_steps": 6188, "loss": 0.1358, "lr": 1.1937823634129416e-05, "epoch": 4.684776457272212, "percentage": 66.9, "elapsed_time": "7:20:18", "remaining_time": "3:37:49"}
834
+ {"current_steps": 4145, "total_steps": 6188, "loss": 0.148, "lr": 1.1886230077969278e-05, "epoch": 4.690435766836446, "percentage": 66.98, "elapsed_time": "7:23:22", "remaining_time": "3:38:31"}
835
+ {"current_steps": 4150, "total_steps": 6188, "loss": 0.1673, "lr": 1.1834701073514306e-05, "epoch": 4.696095076400679, "percentage": 67.07, "elapsed_time": "7:26:20", "remaining_time": "3:39:11"}
836
+ {"current_steps": 4155, "total_steps": 6188, "loss": 0.1474, "lr": 1.1783237030720049e-05, "epoch": 4.701754385964913, "percentage": 67.15, "elapsed_time": "7:29:15", "remaining_time": "3:39:49"}
837
+ {"current_steps": 4160, "total_steps": 6188, "loss": 0.1518, "lr": 1.1731838359025261e-05, "epoch": 4.707413695529145, "percentage": 67.23, "elapsed_time": "7:32:17", "remaining_time": "3:40:29"}
838
+ {"current_steps": 4165, "total_steps": 6188, "loss": 0.159, "lr": 1.1680505467348584e-05, "epoch": 4.713073005093379, "percentage": 67.31, "elapsed_time": "7:35:14", "remaining_time": "3:41:06"}
839
+ {"current_steps": 4170, "total_steps": 6188, "loss": 0.1773, "lr": 1.162923876408535e-05, "epoch": 4.718732314657612, "percentage": 67.39, "elapsed_time": "7:38:05", "remaining_time": "3:41:40"}
840
+ {"current_steps": 4175, "total_steps": 6188, "loss": 0.1793, "lr": 1.1578038657104295e-05, "epoch": 4.724391624221845, "percentage": 67.47, "elapsed_time": "7:41:03", "remaining_time": "3:42:18"}
841
+ {"current_steps": 4180, "total_steps": 6188, "loss": 0.1515, "lr": 1.1526905553744337e-05, "epoch": 4.730050933786078, "percentage": 67.55, "elapsed_time": "7:44:10", "remaining_time": "3:42:58"}
842
+ {"current_steps": 4185, "total_steps": 6188, "loss": 0.1549, "lr": 1.1475839860811301e-05, "epoch": 4.7357102433503115, "percentage": 67.63, "elapsed_time": "7:47:13", "remaining_time": "3:43:37"}
843
+ {"current_steps": 4190, "total_steps": 6188, "loss": 0.1568, "lr": 1.142484198457475e-05, "epoch": 4.741369552914544, "percentage": 67.71, "elapsed_time": "7:50:17", "remaining_time": "3:44:15"}
844
+ {"current_steps": 4195, "total_steps": 6188, "loss": 0.1618, "lr": 1.1373912330764671e-05, "epoch": 4.7470288624787775, "percentage": 67.79, "elapsed_time": "7:53:12", "remaining_time": "3:44:48"}
845
+ {"current_steps": 4200, "total_steps": 6188, "loss": 0.1482, "lr": 1.1323051304568292e-05, "epoch": 4.752688172043011, "percentage": 67.87, "elapsed_time": "7:56:15", "remaining_time": "3:45:25"}