Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2f83b6ec3e0c440e893d30b0c1742fa41604a806777236bc2666e184a7becc32
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6ce5eea1dd417148f094d986a272fe5c0acbd8f0ab164fa256d8127dec312f77
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4fab5cc499300593d0ffde9ee3c478f56356b65d662f42f468d24bab782e3e1
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:10017a208b0ebc8bba8bdb1396e92834259e4f8d639ff9721af7dbbe835196f5
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -64,3 +64,34 @@
|
|
| 64 |
{"current_steps": 630, "total_steps": 957, "loss": 0.6588, "lr": 5e-06, "epoch": 1.9733750978856697, "percentage": 65.83, "elapsed_time": "10:15:39", "remaining_time": "5:19:33"}
|
| 65 |
{"current_steps": 638, "total_steps": 957, "eval_loss": 0.6915597319602966, "epoch": 1.9984338292873924, "percentage": 66.67, "elapsed_time": "10:29:32", "remaining_time": "5:14:46"}
|
| 66 |
{"current_steps": 640, "total_steps": 957, "loss": 0.7005, "lr": 5e-06, "epoch": 2.004698512137823, "percentage": 66.88, "elapsed_time": "10:32:10", "remaining_time": "5:13:07"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 64 |
{"current_steps": 630, "total_steps": 957, "loss": 0.6588, "lr": 5e-06, "epoch": 1.9733750978856697, "percentage": 65.83, "elapsed_time": "10:15:39", "remaining_time": "5:19:33"}
|
| 65 |
{"current_steps": 638, "total_steps": 957, "eval_loss": 0.6915597319602966, "epoch": 1.9984338292873924, "percentage": 66.67, "elapsed_time": "10:29:32", "remaining_time": "5:14:46"}
|
| 66 |
{"current_steps": 640, "total_steps": 957, "loss": 0.7005, "lr": 5e-06, "epoch": 2.004698512137823, "percentage": 66.88, "elapsed_time": "10:32:10", "remaining_time": "5:13:07"}
|
| 67 |
+
{"current_steps": 650, "total_steps": 957, "loss": 0.61, "lr": 5e-06, "epoch": 2.0360219263899766, "percentage": 67.92, "elapsed_time": "10:41:48", "remaining_time": "5:03:08"}
|
| 68 |
+
{"current_steps": 660, "total_steps": 957, "loss": 0.6129, "lr": 5e-06, "epoch": 2.06734534064213, "percentage": 68.97, "elapsed_time": "10:51:28", "remaining_time": "4:53:09"}
|
| 69 |
+
{"current_steps": 670, "total_steps": 957, "loss": 0.6073, "lr": 5e-06, "epoch": 2.0986687548942835, "percentage": 70.01, "elapsed_time": "11:01:08", "remaining_time": "4:43:12"}
|
| 70 |
+
{"current_steps": 680, "total_steps": 957, "loss": 0.6069, "lr": 5e-06, "epoch": 2.129992169146437, "percentage": 71.06, "elapsed_time": "11:10:47", "remaining_time": "4:33:15"}
|
| 71 |
+
{"current_steps": 690, "total_steps": 957, "loss": 0.6115, "lr": 5e-06, "epoch": 2.1613155833985904, "percentage": 72.1, "elapsed_time": "11:20:26", "remaining_time": "4:23:18"}
|
| 72 |
+
{"current_steps": 700, "total_steps": 957, "loss": 0.6083, "lr": 5e-06, "epoch": 2.192638997650744, "percentage": 73.15, "elapsed_time": "11:30:05", "remaining_time": "4:13:21"}
|
| 73 |
+
{"current_steps": 710, "total_steps": 957, "loss": 0.6055, "lr": 5e-06, "epoch": 2.2239624119028973, "percentage": 74.19, "elapsed_time": "11:39:44", "remaining_time": "4:03:25"}
|
| 74 |
+
{"current_steps": 720, "total_steps": 957, "loss": 0.612, "lr": 5e-06, "epoch": 2.255285826155051, "percentage": 75.24, "elapsed_time": "11:49:23", "remaining_time": "3:53:30"}
|
| 75 |
+
{"current_steps": 730, "total_steps": 957, "loss": 0.6119, "lr": 5e-06, "epoch": 2.2866092404072043, "percentage": 76.28, "elapsed_time": "11:59:03", "remaining_time": "3:43:35"}
|
| 76 |
+
{"current_steps": 740, "total_steps": 957, "loss": 0.6113, "lr": 5e-06, "epoch": 2.3179326546593577, "percentage": 77.32, "elapsed_time": "12:08:42", "remaining_time": "3:33:41"}
|
| 77 |
+
{"current_steps": 750, "total_steps": 957, "loss": 0.6111, "lr": 5e-06, "epoch": 2.349256068911511, "percentage": 78.37, "elapsed_time": "12:18:20", "remaining_time": "3:23:46"}
|
| 78 |
+
{"current_steps": 760, "total_steps": 957, "loss": 0.6121, "lr": 5e-06, "epoch": 2.3805794831636646, "percentage": 79.41, "elapsed_time": "12:27:59", "remaining_time": "3:13:53"}
|
| 79 |
+
{"current_steps": 770, "total_steps": 957, "loss": 0.6159, "lr": 5e-06, "epoch": 2.4119028974158185, "percentage": 80.46, "elapsed_time": "12:37:38", "remaining_time": "3:03:59"}
|
| 80 |
+
{"current_steps": 780, "total_steps": 957, "loss": 0.6142, "lr": 5e-06, "epoch": 2.443226311667972, "percentage": 81.5, "elapsed_time": "12:47:17", "remaining_time": "2:54:06"}
|
| 81 |
+
{"current_steps": 790, "total_steps": 957, "loss": 0.6181, "lr": 5e-06, "epoch": 2.4745497259201255, "percentage": 82.55, "elapsed_time": "12:56:56", "remaining_time": "2:44:14"}
|
| 82 |
+
{"current_steps": 800, "total_steps": 957, "loss": 0.6127, "lr": 5e-06, "epoch": 2.505873140172279, "percentage": 83.59, "elapsed_time": "13:06:34", "remaining_time": "2:34:21"}
|
| 83 |
+
{"current_steps": 810, "total_steps": 957, "loss": 0.6192, "lr": 5e-06, "epoch": 2.5371965544244324, "percentage": 84.64, "elapsed_time": "13:16:13", "remaining_time": "2:24:29"}
|
| 84 |
+
{"current_steps": 820, "total_steps": 957, "loss": 0.6098, "lr": 5e-06, "epoch": 2.568519968676586, "percentage": 85.68, "elapsed_time": "13:25:51", "remaining_time": "2:14:38"}
|
| 85 |
+
{"current_steps": 830, "total_steps": 957, "loss": 0.6126, "lr": 5e-06, "epoch": 2.5998433829287393, "percentage": 86.73, "elapsed_time": "13:35:28", "remaining_time": "2:04:46"}
|
| 86 |
+
{"current_steps": 840, "total_steps": 957, "loss": 0.618, "lr": 5e-06, "epoch": 2.6311667971808927, "percentage": 87.77, "elapsed_time": "13:45:06", "remaining_time": "1:54:55"}
|
| 87 |
+
{"current_steps": 850, "total_steps": 957, "loss": 0.6132, "lr": 5e-06, "epoch": 2.662490211433046, "percentage": 88.82, "elapsed_time": "13:54:45", "remaining_time": "1:45:04"}
|
| 88 |
+
{"current_steps": 860, "total_steps": 957, "loss": 0.6211, "lr": 5e-06, "epoch": 2.6938136256851997, "percentage": 89.86, "elapsed_time": "14:04:24", "remaining_time": "1:35:14"}
|
| 89 |
+
{"current_steps": 870, "total_steps": 957, "loss": 0.6072, "lr": 5e-06, "epoch": 2.725137039937353, "percentage": 90.91, "elapsed_time": "14:14:04", "remaining_time": "1:25:24"}
|
| 90 |
+
{"current_steps": 880, "total_steps": 957, "loss": 0.6181, "lr": 5e-06, "epoch": 2.7564604541895066, "percentage": 91.95, "elapsed_time": "14:23:43", "remaining_time": "1:15:34"}
|
| 91 |
+
{"current_steps": 890, "total_steps": 957, "loss": 0.6183, "lr": 5e-06, "epoch": 2.78778386844166, "percentage": 93.0, "elapsed_time": "14:33:23", "remaining_time": "1:05:44"}
|
| 92 |
+
{"current_steps": 900, "total_steps": 957, "loss": 0.6185, "lr": 5e-06, "epoch": 2.8191072826938135, "percentage": 94.04, "elapsed_time": "14:43:02", "remaining_time": "0:55:55"}
|
| 93 |
+
{"current_steps": 910, "total_steps": 957, "loss": 0.6113, "lr": 5e-06, "epoch": 2.850430696945967, "percentage": 95.09, "elapsed_time": "14:52:41", "remaining_time": "0:46:06"}
|
| 94 |
+
{"current_steps": 920, "total_steps": 957, "loss": 0.613, "lr": 5e-06, "epoch": 2.881754111198121, "percentage": 96.13, "elapsed_time": "15:02:20", "remaining_time": "0:36:17"}
|
| 95 |
+
{"current_steps": 930, "total_steps": 957, "loss": 0.6178, "lr": 5e-06, "epoch": 2.913077525450274, "percentage": 97.18, "elapsed_time": "15:12:00", "remaining_time": "0:26:28"}
|
| 96 |
+
{"current_steps": 940, "total_steps": 957, "loss": 0.6157, "lr": 5e-06, "epoch": 2.9444009397024278, "percentage": 98.22, "elapsed_time": "15:21:40", "remaining_time": "0:16:40"}
|
| 97 |
+
{"current_steps": 950, "total_steps": 957, "loss": 0.6176, "lr": 5e-06, "epoch": 2.975724353954581, "percentage": 99.27, "elapsed_time": "15:31:18", "remaining_time": "0:06:51"}
|