Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a746ce57a143285df0995e2c303c0788e992f64bf845a1eea9ba6ad07ca8f885
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:094c2740982f3d968f2a165b29e4072697bdd2bed1bc055a97db6c024804f4bc
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d9f124e5da760974f5acfc6e31d6363342aefde9507dab1d91ed68f286f530c5
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5af6f28757c25fbbaf0500d437b73effec793601270c2ae6bbaff05e6a3dfb26
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -65,3 +65,36 @@
|
|
| 65 |
{"current_steps": 640, "total_steps": 981, "loss": 0.7075, "lr": 5e-06, "epoch": 1.9564386702330914, "percentage": 65.24, "elapsed_time": "10:25:02", "remaining_time": "5:33:01"}
|
| 66 |
{"current_steps": 650, "total_steps": 981, "loss": 0.7082, "lr": 5e-06, "epoch": 1.9870080244554833, "percentage": 66.26, "elapsed_time": "10:34:41", "remaining_time": "5:23:12"}
|
| 67 |
{"current_steps": 654, "total_steps": 981, "eval_loss": 0.7433667182922363, "epoch": 1.9992357661444402, "percentage": 66.67, "elapsed_time": "10:44:34", "remaining_time": "5:22:17"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 65 |
{"current_steps": 640, "total_steps": 981, "loss": 0.7075, "lr": 5e-06, "epoch": 1.9564386702330914, "percentage": 65.24, "elapsed_time": "10:25:02", "remaining_time": "5:33:01"}
|
| 66 |
{"current_steps": 650, "total_steps": 981, "loss": 0.7082, "lr": 5e-06, "epoch": 1.9870080244554833, "percentage": 66.26, "elapsed_time": "10:34:41", "remaining_time": "5:23:12"}
|
| 67 |
{"current_steps": 654, "total_steps": 981, "eval_loss": 0.7433667182922363, "epoch": 1.9992357661444402, "percentage": 66.67, "elapsed_time": "10:44:34", "remaining_time": "5:22:17"}
|
| 68 |
+
{"current_steps": 660, "total_steps": 981, "loss": 0.7384, "lr": 5e-06, "epoch": 2.0175773786778755, "percentage": 67.28, "elapsed_time": "10:51:20", "remaining_time": "5:16:47"}
|
| 69 |
+
{"current_steps": 670, "total_steps": 981, "loss": 0.6584, "lr": 5e-06, "epoch": 2.0481467329002676, "percentage": 68.3, "elapsed_time": "11:00:57", "remaining_time": "5:06:48"}
|
| 70 |
+
{"current_steps": 680, "total_steps": 981, "loss": 0.6626, "lr": 5e-06, "epoch": 2.0787160871226593, "percentage": 69.32, "elapsed_time": "11:10:38", "remaining_time": "4:56:51"}
|
| 71 |
+
{"current_steps": 690, "total_steps": 981, "loss": 0.6584, "lr": 5e-06, "epoch": 2.1092854413450515, "percentage": 70.34, "elapsed_time": "11:20:18", "remaining_time": "4:46:54"}
|
| 72 |
+
{"current_steps": 700, "total_steps": 981, "loss": 0.6637, "lr": 5e-06, "epoch": 2.1398547955674436, "percentage": 71.36, "elapsed_time": "11:29:57", "remaining_time": "4:36:58"}
|
| 73 |
+
{"current_steps": 710, "total_steps": 981, "loss": 0.664, "lr": 5e-06, "epoch": 2.1704241497898358, "percentage": 72.38, "elapsed_time": "11:39:37", "remaining_time": "4:27:02"}
|
| 74 |
+
{"current_steps": 720, "total_steps": 981, "loss": 0.6639, "lr": 5e-06, "epoch": 2.200993504012228, "percentage": 73.39, "elapsed_time": "11:49:18", "remaining_time": "4:17:07"}
|
| 75 |
+
{"current_steps": 730, "total_steps": 981, "loss": 0.6644, "lr": 5e-06, "epoch": 2.2315628582346196, "percentage": 74.41, "elapsed_time": "11:58:56", "remaining_time": "4:07:12"}
|
| 76 |
+
{"current_steps": 740, "total_steps": 981, "loss": 0.6597, "lr": 5e-06, "epoch": 2.262132212457012, "percentage": 75.43, "elapsed_time": "12:08:35", "remaining_time": "3:57:16"}
|
| 77 |
+
{"current_steps": 750, "total_steps": 981, "loss": 0.6649, "lr": 5e-06, "epoch": 2.292701566679404, "percentage": 76.45, "elapsed_time": "12:18:13", "remaining_time": "3:47:22"}
|
| 78 |
+
{"current_steps": 760, "total_steps": 981, "loss": 0.6659, "lr": 5e-06, "epoch": 2.323270920901796, "percentage": 77.47, "elapsed_time": "12:27:51", "remaining_time": "3:37:28"}
|
| 79 |
+
{"current_steps": 770, "total_steps": 981, "loss": 0.663, "lr": 5e-06, "epoch": 2.353840275124188, "percentage": 78.49, "elapsed_time": "12:37:30", "remaining_time": "3:27:34"}
|
| 80 |
+
{"current_steps": 780, "total_steps": 981, "loss": 0.6615, "lr": 5e-06, "epoch": 2.38440962934658, "percentage": 79.51, "elapsed_time": "12:47:10", "remaining_time": "3:17:41"}
|
| 81 |
+
{"current_steps": 790, "total_steps": 981, "loss": 0.6668, "lr": 5e-06, "epoch": 2.414978983568972, "percentage": 80.53, "elapsed_time": "12:56:50", "remaining_time": "3:07:49"}
|
| 82 |
+
{"current_steps": 800, "total_steps": 981, "loss": 0.6652, "lr": 5e-06, "epoch": 2.4455483377913643, "percentage": 81.55, "elapsed_time": "13:06:30", "remaining_time": "2:57:56"}
|
| 83 |
+
{"current_steps": 810, "total_steps": 981, "loss": 0.6658, "lr": 5e-06, "epoch": 2.476117692013756, "percentage": 82.57, "elapsed_time": "13:16:09", "remaining_time": "2:48:04"}
|
| 84 |
+
{"current_steps": 820, "total_steps": 981, "loss": 0.6652, "lr": 5e-06, "epoch": 2.506687046236148, "percentage": 83.59, "elapsed_time": "13:25:47", "remaining_time": "2:38:12"}
|
| 85 |
+
{"current_steps": 830, "total_steps": 981, "loss": 0.6667, "lr": 5e-06, "epoch": 2.5372564004585403, "percentage": 84.61, "elapsed_time": "13:35:26", "remaining_time": "2:28:21"}
|
| 86 |
+
{"current_steps": 840, "total_steps": 981, "loss": 0.6675, "lr": 5e-06, "epoch": 2.5678257546809324, "percentage": 85.63, "elapsed_time": "13:45:07", "remaining_time": "2:18:30"}
|
| 87 |
+
{"current_steps": 850, "total_steps": 981, "loss": 0.6645, "lr": 5e-06, "epoch": 2.5983951089033246, "percentage": 86.65, "elapsed_time": "13:54:45", "remaining_time": "2:08:38"}
|
| 88 |
+
{"current_steps": 860, "total_steps": 981, "loss": 0.6632, "lr": 5e-06, "epoch": 2.6289644631257163, "percentage": 87.67, "elapsed_time": "14:04:25", "remaining_time": "1:58:48"}
|
| 89 |
+
{"current_steps": 870, "total_steps": 981, "loss": 0.668, "lr": 5e-06, "epoch": 2.6595338173481085, "percentage": 88.69, "elapsed_time": "14:14:05", "remaining_time": "1:48:58"}
|
| 90 |
+
{"current_steps": 880, "total_steps": 981, "loss": 0.668, "lr": 5e-06, "epoch": 2.6901031715705006, "percentage": 89.7, "elapsed_time": "14:23:45", "remaining_time": "1:39:08"}
|
| 91 |
+
{"current_steps": 890, "total_steps": 981, "loss": 0.6673, "lr": 5e-06, "epoch": 2.7206725257928928, "percentage": 90.72, "elapsed_time": "14:33:25", "remaining_time": "1:29:18"}
|
| 92 |
+
{"current_steps": 900, "total_steps": 981, "loss": 0.6682, "lr": 5e-06, "epoch": 2.751241880015285, "percentage": 91.74, "elapsed_time": "14:43:04", "remaining_time": "1:19:28"}
|
| 93 |
+
{"current_steps": 910, "total_steps": 981, "loss": 0.6654, "lr": 5e-06, "epoch": 2.7818112342376766, "percentage": 92.76, "elapsed_time": "14:52:43", "remaining_time": "1:09:39"}
|
| 94 |
+
{"current_steps": 920, "total_steps": 981, "loss": 0.6644, "lr": 5e-06, "epoch": 2.8123805884600688, "percentage": 93.78, "elapsed_time": "15:02:24", "remaining_time": "0:59:49"}
|
| 95 |
+
{"current_steps": 930, "total_steps": 981, "loss": 0.6662, "lr": 5e-06, "epoch": 2.842949942682461, "percentage": 94.8, "elapsed_time": "15:12:04", "remaining_time": "0:50:01"}
|
| 96 |
+
{"current_steps": 940, "total_steps": 981, "loss": 0.6663, "lr": 5e-06, "epoch": 2.8735192969048526, "percentage": 95.82, "elapsed_time": "15:21:44", "remaining_time": "0:40:12"}
|
| 97 |
+
{"current_steps": 950, "total_steps": 981, "loss": 0.6658, "lr": 5e-06, "epoch": 2.904088651127245, "percentage": 96.84, "elapsed_time": "15:31:24", "remaining_time": "0:30:23"}
|
| 98 |
+
{"current_steps": 960, "total_steps": 981, "loss": 0.667, "lr": 5e-06, "epoch": 2.934658005349637, "percentage": 97.86, "elapsed_time": "15:41:04", "remaining_time": "0:20:35"}
|
| 99 |
+
{"current_steps": 970, "total_steps": 981, "loss": 0.6669, "lr": 5e-06, "epoch": 2.965227359572029, "percentage": 98.88, "elapsed_time": "15:50:45", "remaining_time": "0:10:46"}
|
| 100 |
+
{"current_steps": 980, "total_steps": 981, "loss": 0.6679, "lr": 5e-06, "epoch": 2.9957967137944213, "percentage": 99.9, "elapsed_time": "16:00:25", "remaining_time": "0:00:58"}
|