Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2bef87fe08aa759c4f245e8f5348e32e219426d6c11855102d110bc59c7dc3c1
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf1943712ee28f0653b95a796d6b1a976e019a3dc424fa07b30419463f9c210f
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:35fbac87a642c80bb2261b3d16a394bf137e2304a553db7c38342914d49bca90
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:138fd35b40889eda902fb945fdd365bb9c42936f2d52a029a05d84daf0b9fdfd
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -57,3 +57,31 @@
|
|
| 57 |
{"current_steps": 560, "total_steps": 852, "loss": 0.6783, "lr": 5e-06, "epoch": 1.968804920913884, "percentage": 65.73, "elapsed_time": "9:07:35", "remaining_time": "4:45:31"}
|
| 58 |
{"current_steps": 568, "total_steps": 852, "eval_loss": 0.7088373899459839, "epoch": 1.9969244288224957, "percentage": 66.67, "elapsed_time": "9:21:03", "remaining_time": "4:40:31"}
|
| 59 |
{"current_steps": 570, "total_steps": 852, "loss": 0.7079, "lr": 5e-06, "epoch": 2.0043936731107204, "percentage": 66.9, "elapsed_time": "9:23:32", "remaining_time": "4:38:48"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 57 |
{"current_steps": 560, "total_steps": 852, "loss": 0.6783, "lr": 5e-06, "epoch": 1.968804920913884, "percentage": 65.73, "elapsed_time": "9:07:35", "remaining_time": "4:45:31"}
|
| 58 |
{"current_steps": 568, "total_steps": 852, "eval_loss": 0.7088373899459839, "epoch": 1.9969244288224957, "percentage": 66.67, "elapsed_time": "9:21:03", "remaining_time": "4:40:31"}
|
| 59 |
{"current_steps": 570, "total_steps": 852, "loss": 0.7079, "lr": 5e-06, "epoch": 2.0043936731107204, "percentage": 66.9, "elapsed_time": "9:23:32", "remaining_time": "4:38:48"}
|
| 60 |
+
{"current_steps": 580, "total_steps": 852, "loss": 0.6203, "lr": 5e-06, "epoch": 2.039543057996485, "percentage": 68.08, "elapsed_time": "9:33:13", "remaining_time": "4:28:49"}
|
| 61 |
+
{"current_steps": 590, "total_steps": 852, "loss": 0.6244, "lr": 5e-06, "epoch": 2.0746924428822497, "percentage": 69.25, "elapsed_time": "9:42:53", "remaining_time": "4:18:50"}
|
| 62 |
+
{"current_steps": 600, "total_steps": 852, "loss": 0.6189, "lr": 5e-06, "epoch": 2.109841827768014, "percentage": 70.42, "elapsed_time": "9:52:33", "remaining_time": "4:08:52"}
|
| 63 |
+
{"current_steps": 610, "total_steps": 852, "loss": 0.6207, "lr": 5e-06, "epoch": 2.1449912126537787, "percentage": 71.6, "elapsed_time": "10:02:12", "remaining_time": "3:58:54"}
|
| 64 |
+
{"current_steps": 620, "total_steps": 852, "loss": 0.6203, "lr": 5e-06, "epoch": 2.180140597539543, "percentage": 72.77, "elapsed_time": "10:11:53", "remaining_time": "3:48:58"}
|
| 65 |
+
{"current_steps": 630, "total_steps": 852, "loss": 0.6281, "lr": 5e-06, "epoch": 2.2152899824253076, "percentage": 73.94, "elapsed_time": "10:21:32", "remaining_time": "3:39:01"}
|
| 66 |
+
{"current_steps": 640, "total_steps": 852, "loss": 0.6246, "lr": 5e-06, "epoch": 2.2504393673110723, "percentage": 75.12, "elapsed_time": "10:31:12", "remaining_time": "3:29:05"}
|
| 67 |
+
{"current_steps": 650, "total_steps": 852, "loss": 0.6277, "lr": 5e-06, "epoch": 2.2855887521968365, "percentage": 76.29, "elapsed_time": "10:40:52", "remaining_time": "3:19:09"}
|
| 68 |
+
{"current_steps": 660, "total_steps": 852, "loss": 0.631, "lr": 5e-06, "epoch": 2.3207381370826012, "percentage": 77.46, "elapsed_time": "10:50:32", "remaining_time": "3:09:14"}
|
| 69 |
+
{"current_steps": 670, "total_steps": 852, "loss": 0.627, "lr": 5e-06, "epoch": 2.3558875219683655, "percentage": 78.64, "elapsed_time": "11:00:11", "remaining_time": "2:59:20"}
|
| 70 |
+
{"current_steps": 680, "total_steps": 852, "loss": 0.6252, "lr": 5e-06, "epoch": 2.39103690685413, "percentage": 79.81, "elapsed_time": "11:09:51", "remaining_time": "2:49:26"}
|
| 71 |
+
{"current_steps": 690, "total_steps": 852, "loss": 0.631, "lr": 5e-06, "epoch": 2.4261862917398944, "percentage": 80.99, "elapsed_time": "11:19:31", "remaining_time": "2:39:32"}
|
| 72 |
+
{"current_steps": 700, "total_steps": 852, "loss": 0.6238, "lr": 5e-06, "epoch": 2.461335676625659, "percentage": 82.16, "elapsed_time": "11:29:11", "remaining_time": "2:29:39"}
|
| 73 |
+
{"current_steps": 710, "total_steps": 852, "loss": 0.6244, "lr": 5e-06, "epoch": 2.4964850615114234, "percentage": 83.33, "elapsed_time": "11:38:50", "remaining_time": "2:19:46"}
|
| 74 |
+
{"current_steps": 720, "total_steps": 852, "loss": 0.6254, "lr": 5e-06, "epoch": 2.531634446397188, "percentage": 84.51, "elapsed_time": "11:48:26", "remaining_time": "2:09:52"}
|
| 75 |
+
{"current_steps": 730, "total_steps": 852, "loss": 0.6248, "lr": 5e-06, "epoch": 2.5667838312829527, "percentage": 85.68, "elapsed_time": "11:58:06", "remaining_time": "2:00:00"}
|
| 76 |
+
{"current_steps": 740, "total_steps": 852, "loss": 0.6256, "lr": 5e-06, "epoch": 2.601933216168717, "percentage": 86.85, "elapsed_time": "12:07:46", "remaining_time": "1:50:08"}
|
| 77 |
+
{"current_steps": 750, "total_steps": 852, "loss": 0.6286, "lr": 5e-06, "epoch": 2.6370826010544817, "percentage": 88.03, "elapsed_time": "12:17:26", "remaining_time": "1:40:17"}
|
| 78 |
+
{"current_steps": 760, "total_steps": 852, "loss": 0.628, "lr": 5e-06, "epoch": 2.672231985940246, "percentage": 89.2, "elapsed_time": "12:27:04", "remaining_time": "1:30:26"}
|
| 79 |
+
{"current_steps": 770, "total_steps": 852, "loss": 0.6267, "lr": 5e-06, "epoch": 2.7073813708260106, "percentage": 90.38, "elapsed_time": "12:36:44", "remaining_time": "1:20:35"}
|
| 80 |
+
{"current_steps": 780, "total_steps": 852, "loss": 0.6261, "lr": 5e-06, "epoch": 2.7425307557117753, "percentage": 91.55, "elapsed_time": "12:46:25", "remaining_time": "1:10:44"}
|
| 81 |
+
{"current_steps": 790, "total_steps": 852, "loss": 0.6256, "lr": 5e-06, "epoch": 2.7776801405975395, "percentage": 92.72, "elapsed_time": "12:56:04", "remaining_time": "1:00:54"}
|
| 82 |
+
{"current_steps": 800, "total_steps": 852, "loss": 0.6247, "lr": 5e-06, "epoch": 2.812829525483304, "percentage": 93.9, "elapsed_time": "13:05:43", "remaining_time": "0:51:04"}
|
| 83 |
+
{"current_steps": 810, "total_steps": 852, "loss": 0.6269, "lr": 5e-06, "epoch": 2.8479789103690685, "percentage": 95.07, "elapsed_time": "13:15:23", "remaining_time": "0:41:14"}
|
| 84 |
+
{"current_steps": 820, "total_steps": 852, "loss": 0.6279, "lr": 5e-06, "epoch": 2.883128295254833, "percentage": 96.24, "elapsed_time": "13:25:03", "remaining_time": "0:31:25"}
|
| 85 |
+
{"current_steps": 830, "total_steps": 852, "loss": 0.6212, "lr": 5e-06, "epoch": 2.9182776801405974, "percentage": 97.42, "elapsed_time": "13:34:41", "remaining_time": "0:21:35"}
|
| 86 |
+
{"current_steps": 840, "total_steps": 852, "loss": 0.6282, "lr": 5e-06, "epoch": 2.953427065026362, "percentage": 98.59, "elapsed_time": "13:44:23", "remaining_time": "0:11:46"}
|
| 87 |
+
{"current_steps": 850, "total_steps": 852, "loss": 0.6277, "lr": 5e-06, "epoch": 2.9885764499121263, "percentage": 99.77, "elapsed_time": "13:54:04", "remaining_time": "0:01:57"}
|