Training in progress, step 5200
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:03ef76a6ba267115adecbd717ed5b6c3d1a42e94d2558a3d9596b02f28e38b3c
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0f2fc4496cfe38a75c60ffb6da8f9225b1f65b83fd22a1a181fbfdd4c2907ab4
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:476c07cfbbd73d3f8ffdde332a82f1934f1c8a631e8544a01626c42b66f65380
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0d335eb82c918d4e2523a9aa3f1a0cb3410ecc07e5e425bb972b26bc765ba0f5
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -1001,3 +1001,44 @@
|
|
| 1001 |
{"current_steps": 4995, "total_steps": 6188, "loss": 0.0625, "lr": 4.367893544535757e-06, "epoch": 5.65195246179966, "percentage": 80.72, "elapsed_time": "14:52:40", "remaining_time": "3:33:12"}
|
| 1002 |
{"current_steps": 5000, "total_steps": 6188, "loss": 0.0615, "lr": 4.332767381597575e-06, "epoch": 5.657611771363894, "percentage": 80.8, "elapsed_time": "14:54:11", "remaining_time": "3:32:27"}
|
| 1003 |
{"current_steps": 5005, "total_steps": 6188, "loss": 0.0647, "lr": 4.297765864365453e-06, "epoch": 5.663271080928126, "percentage": 80.88, "elapsed_time": "14:57:02", "remaining_time": "3:32:01"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1001 |
{"current_steps": 4995, "total_steps": 6188, "loss": 0.0625, "lr": 4.367893544535757e-06, "epoch": 5.65195246179966, "percentage": 80.72, "elapsed_time": "14:52:40", "remaining_time": "3:33:12"}
|
| 1002 |
{"current_steps": 5000, "total_steps": 6188, "loss": 0.0615, "lr": 4.332767381597575e-06, "epoch": 5.657611771363894, "percentage": 80.8, "elapsed_time": "14:54:11", "remaining_time": "3:32:27"}
|
| 1003 |
{"current_steps": 5005, "total_steps": 6188, "loss": 0.0647, "lr": 4.297765864365453e-06, "epoch": 5.663271080928126, "percentage": 80.88, "elapsed_time": "14:57:02", "remaining_time": "3:32:01"}
|
| 1004 |
+
{"current_steps": 5010, "total_steps": 6188, "loss": 0.1096, "lr": 4.262889271305204e-06, "epoch": 5.66893039049236, "percentage": 80.96, "elapsed_time": "14:59:18", "remaining_time": "3:31:27"}
|
| 1005 |
+
{"current_steps": 5015, "total_steps": 6188, "loss": 0.0926, "lr": 4.228137879888774e-06, "epoch": 5.674589700056593, "percentage": 81.04, "elapsed_time": "15:01:07", "remaining_time": "3:30:46"}
|
| 1006 |
+
{"current_steps": 5020, "total_steps": 6188, "loss": 0.0755, "lr": 4.193511966592041e-06, "epoch": 5.680249009620827, "percentage": 81.12, "elapsed_time": "15:02:40", "remaining_time": "3:30:01"}
|
| 1007 |
+
{"current_steps": 5025, "total_steps": 6188, "loss": 0.0911, "lr": 4.1590118068925815e-06, "epoch": 5.685908319185059, "percentage": 81.21, "elapsed_time": "15:04:22", "remaining_time": "3:29:18"}
|
| 1008 |
+
{"current_steps": 5030, "total_steps": 6188, "loss": 0.1086, "lr": 4.124637675267511e-06, "epoch": 5.691567628749293, "percentage": 81.29, "elapsed_time": "15:06:13", "remaining_time": "3:28:37"}
|
| 1009 |
+
{"current_steps": 5035, "total_steps": 6188, "loss": 0.0774, "lr": 4.090389845191278e-06, "epoch": 5.697226938313526, "percentage": 81.37, "elapsed_time": "15:07:47", "remaining_time": "3:27:52"}
|
| 1010 |
+
{"current_steps": 5040, "total_steps": 6188, "loss": 0.095, "lr": 4.056268589133516e-06, "epoch": 5.702886247877759, "percentage": 81.45, "elapsed_time": "15:09:23", "remaining_time": "3:27:08"}
|
| 1011 |
+
{"current_steps": 5045, "total_steps": 6188, "loss": 0.0772, "lr": 4.022274178556844e-06, "epoch": 5.708545557441992, "percentage": 81.53, "elapsed_time": "15:10:59", "remaining_time": "3:26:23"}
|
| 1012 |
+
{"current_steps": 5050, "total_steps": 6188, "loss": 0.0696, "lr": 3.988406883914717e-06, "epoch": 5.7142048670062255, "percentage": 81.61, "elapsed_time": "15:12:47", "remaining_time": "3:25:41"}
|
| 1013 |
+
{"current_steps": 5055, "total_steps": 6188, "loss": 0.076, "lr": 3.954666974649295e-06, "epoch": 5.719864176570458, "percentage": 81.69, "elapsed_time": "15:14:49", "remaining_time": "3:25:02"}
|
| 1014 |
+
{"current_steps": 5060, "total_steps": 6188, "loss": 0.0679, "lr": 3.921054719189272e-06, "epoch": 5.7255234861346915, "percentage": 81.77, "elapsed_time": "15:16:48", "remaining_time": "3:24:22"}
|
| 1015 |
+
{"current_steps": 5065, "total_steps": 6188, "loss": 0.0657, "lr": 3.887570384947745e-06, "epoch": 5.731182795698925, "percentage": 81.85, "elapsed_time": "15:18:27", "remaining_time": "3:23:38"}
|
| 1016 |
+
{"current_steps": 5070, "total_steps": 6188, "loss": 0.0783, "lr": 3.854214238320109e-06, "epoch": 5.7368421052631575, "percentage": 81.93, "elapsed_time": "15:20:21", "remaining_time": "3:22:57"}
|
| 1017 |
+
{"current_steps": 5075, "total_steps": 6188, "loss": 0.0818, "lr": 3.8209865446819105e-06, "epoch": 5.742501414827391, "percentage": 82.01, "elapsed_time": "15:22:20", "remaining_time": "3:22:16"}
|
| 1018 |
+
{"current_steps": 5080, "total_steps": 6188, "loss": 0.0845, "lr": 3.7878875683867476e-06, "epoch": 5.748160724391624, "percentage": 82.09, "elapsed_time": "15:23:55", "remaining_time": "3:21:30"}
|
| 1019 |
+
{"current_steps": 5085, "total_steps": 6188, "loss": 0.0697, "lr": 3.7549175727641606e-06, "epoch": 5.753820033955858, "percentage": 82.18, "elapsed_time": "15:25:34", "remaining_time": "3:20:46"}
|
| 1020 |
+
{"current_steps": 5090, "total_steps": 6188, "loss": 0.0718, "lr": 3.7220768201175615e-06, "epoch": 5.75947934352009, "percentage": 82.26, "elapsed_time": "15:27:13", "remaining_time": "3:20:01"}
|
| 1021 |
+
{"current_steps": 5095, "total_steps": 6188, "loss": 0.0798, "lr": 3.689365571722112e-06, "epoch": 5.765138653084324, "percentage": 82.34, "elapsed_time": "15:29:00", "remaining_time": "3:19:17"}
|
| 1022 |
+
{"current_steps": 5100, "total_steps": 6188, "loss": 0.0592, "lr": 3.6567840878226577e-06, "epoch": 5.770797962648556, "percentage": 82.42, "elapsed_time": "15:30:34", "remaining_time": "3:18:31"}
|
| 1023 |
+
{"current_steps": 5105, "total_steps": 6188, "loss": 0.0763, "lr": 3.624332627631679e-06, "epoch": 5.77645727221279, "percentage": 82.5, "elapsed_time": "15:32:08", "remaining_time": "3:17:44"}
|
| 1024 |
+
{"current_steps": 5110, "total_steps": 6188, "loss": 0.0745, "lr": 3.5920114493271974e-06, "epoch": 5.782116581777023, "percentage": 82.58, "elapsed_time": "15:33:47", "remaining_time": "3:16:59"}
|
| 1025 |
+
{"current_steps": 5115, "total_steps": 6188, "loss": 0.0847, "lr": 3.5598208100507314e-06, "epoch": 5.787775891341257, "percentage": 82.66, "elapsed_time": "15:35:33", "remaining_time": "3:16:15"}
|
| 1026 |
+
{"current_steps": 5120, "total_steps": 6188, "loss": 0.0754, "lr": 3.5277609659052712e-06, "epoch": 5.793435200905489, "percentage": 82.74, "elapsed_time": "15:37:16", "remaining_time": "3:15:30"}
|
| 1027 |
+
{"current_steps": 5125, "total_steps": 6188, "loss": 0.0807, "lr": 3.4958321719532106e-06, "epoch": 5.799094510469723, "percentage": 82.82, "elapsed_time": "15:38:45", "remaining_time": "3:14:42"}
|
| 1028 |
+
{"current_steps": 5130, "total_steps": 6188, "loss": 0.0763, "lr": 3.4640346822143324e-06, "epoch": 5.804753820033956, "percentage": 82.9, "elapsed_time": "15:40:34", "remaining_time": "3:13:58"}
|
| 1029 |
+
{"current_steps": 5135, "total_steps": 6188, "loss": 0.0834, "lr": 3.4323687496637837e-06, "epoch": 5.810413129598189, "percentage": 82.98, "elapsed_time": "15:42:18", "remaining_time": "3:13:13"}
|
| 1030 |
+
{"current_steps": 5140, "total_steps": 6188, "loss": 0.0748, "lr": 3.4008346262300852e-06, "epoch": 5.816072439162422, "percentage": 83.06, "elapsed_time": "15:43:55", "remaining_time": "3:12:27"}
|
| 1031 |
+
{"current_steps": 5145, "total_steps": 6188, "loss": 0.0674, "lr": 3.3694325627930846e-06, "epoch": 5.8217317487266556, "percentage": 83.14, "elapsed_time": "15:45:23", "remaining_time": "3:11:38"}
|
| 1032 |
+
{"current_steps": 5150, "total_steps": 6188, "loss": 0.0877, "lr": 3.3381628091819907e-06, "epoch": 5.827391058290889, "percentage": 83.23, "elapsed_time": "15:47:22", "remaining_time": "3:10:56"}
|
| 1033 |
+
{"current_steps": 5155, "total_steps": 6188, "loss": 0.0668, "lr": 3.3070256141733913e-06, "epoch": 5.8330503678551215, "percentage": 83.31, "elapsed_time": "15:49:00", "remaining_time": "3:10:10"}
|
| 1034 |
+
{"current_steps": 5160, "total_steps": 6188, "loss": 0.0663, "lr": 3.2760212254892453e-06, "epoch": 5.838709677419355, "percentage": 83.39, "elapsed_time": "15:50:48", "remaining_time": "3:09:25"}
|
| 1035 |
+
{"current_steps": 5165, "total_steps": 6188, "loss": 0.0755, "lr": 3.245149889794932e-06, "epoch": 5.8443689869835875, "percentage": 83.47, "elapsed_time": "15:52:38", "remaining_time": "3:08:41"}
|
| 1036 |
+
{"current_steps": 5170, "total_steps": 6188, "loss": 0.0609, "lr": 3.2144118526972943e-06, "epoch": 5.850028296547821, "percentage": 83.55, "elapsed_time": "15:54:18", "remaining_time": "3:07:54"}
|
| 1037 |
+
{"current_steps": 5175, "total_steps": 6188, "loss": 0.0612, "lr": 3.1838073587426676e-06, "epoch": 5.855687606112054, "percentage": 83.63, "elapsed_time": "15:55:54", "remaining_time": "3:07:06"}
|
| 1038 |
+
{"current_steps": 5180, "total_steps": 6188, "loss": 0.079, "lr": 3.153336651414933e-06, "epoch": 5.861346915676288, "percentage": 83.71, "elapsed_time": "15:57:34", "remaining_time": "3:06:20"}
|
| 1039 |
+
{"current_steps": 5185, "total_steps": 6188, "loss": 0.0941, "lr": 3.1229999731336137e-06, "epoch": 5.86700622524052, "percentage": 83.79, "elapsed_time": "15:59:25", "remaining_time": "3:05:35"}
|
| 1040 |
+
{"current_steps": 5190, "total_steps": 6188, "loss": 0.0713, "lr": 3.0927975652518994e-06, "epoch": 5.872665534804754, "percentage": 83.87, "elapsed_time": "16:01:00", "remaining_time": "3:04:47"}
|
| 1041 |
+
{"current_steps": 5195, "total_steps": 6188, "loss": 0.0797, "lr": 3.062729668054756e-06, "epoch": 5.878324844368987, "percentage": 83.95, "elapsed_time": "16:02:37", "remaining_time": "3:04:00"}
|
| 1042 |
+
{"current_steps": 5200, "total_steps": 6188, "loss": 0.0904, "lr": 3.032796520757002e-06, "epoch": 5.88398415393322, "percentage": 84.03, "elapsed_time": "16:04:12", "remaining_time": "3:03:11"}
|
| 1043 |
+
{"current_steps": 5205, "total_steps": 6188, "loss": 0.0683, "lr": 3.0029983615014234e-06, "epoch": 5.889643463497453, "percentage": 84.11, "elapsed_time": "16:06:55", "remaining_time": "3:02:36"}
|
| 1044 |
+
{"current_steps": 5210, "total_steps": 6188, "loss": 0.0739, "lr": 2.9733354273568514e-06, "epoch": 5.895302773061687, "percentage": 84.2, "elapsed_time": "16:08:29", "remaining_time": "3:01:48"}
|