Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3a6e779afcc3dd063450f41d163042ee61c114fd52ebf27ed4dce854416c4dc4
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:965bd6a3e77b7215f64703a397579790961052df0dfb4a4e11121bf4c431da4a
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a3c7eb8cbc926b31d653770c13b396d7a46f151a6b00dcc5c3d682f9ecf5716b
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e1edd53054da16982db7b30edf97e505684b42ad6bf577709c5e18d22022c54c
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -32,3 +32,20 @@
|
|
| 32 |
{"current_steps": 310, "total_steps": 480, "loss": 0.4789, "lr": 5e-06, "epoch": 1.9359875097580015, "percentage": 64.58, "elapsed_time": "2:48:44", "remaining_time": "1:32:31"}
|
| 33 |
{"current_steps": 320, "total_steps": 480, "loss": 0.4787, "lr": 5e-06, "epoch": 1.9984387197501952, "percentage": 66.67, "elapsed_time": "2:54:06", "remaining_time": "1:27:03"}
|
| 34 |
{"current_steps": 320, "total_steps": 480, "eval_loss": 0.5198609828948975, "epoch": 1.9984387197501952, "percentage": 66.67, "elapsed_time": "2:56:03", "remaining_time": "1:28:01"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 32 |
{"current_steps": 310, "total_steps": 480, "loss": 0.4789, "lr": 5e-06, "epoch": 1.9359875097580015, "percentage": 64.58, "elapsed_time": "2:48:44", "remaining_time": "1:32:31"}
|
| 33 |
{"current_steps": 320, "total_steps": 480, "loss": 0.4787, "lr": 5e-06, "epoch": 1.9984387197501952, "percentage": 66.67, "elapsed_time": "2:54:06", "remaining_time": "1:27:03"}
|
| 34 |
{"current_steps": 320, "total_steps": 480, "eval_loss": 0.5198609828948975, "epoch": 1.9984387197501952, "percentage": 66.67, "elapsed_time": "2:56:03", "remaining_time": "1:28:01"}
|
| 35 |
+
{"current_steps": 330, "total_steps": 480, "loss": 0.4873, "lr": 5e-06, "epoch": 2.060889929742389, "percentage": 68.75, "elapsed_time": "3:02:31", "remaining_time": "1:22:58"}
|
| 36 |
+
{"current_steps": 340, "total_steps": 480, "loss": 0.4362, "lr": 5e-06, "epoch": 2.1233411397345825, "percentage": 70.83, "elapsed_time": "3:07:49", "remaining_time": "1:17:20"}
|
| 37 |
+
{"current_steps": 350, "total_steps": 480, "loss": 0.4425, "lr": 5e-06, "epoch": 2.185792349726776, "percentage": 72.92, "elapsed_time": "3:13:09", "remaining_time": "1:11:44"}
|
| 38 |
+
{"current_steps": 360, "total_steps": 480, "loss": 0.4355, "lr": 5e-06, "epoch": 2.2482435597189694, "percentage": 75.0, "elapsed_time": "3:18:30", "remaining_time": "1:06:10"}
|
| 39 |
+
{"current_steps": 370, "total_steps": 480, "loss": 0.4384, "lr": 5e-06, "epoch": 2.310694769711163, "percentage": 77.08, "elapsed_time": "3:23:49", "remaining_time": "1:00:35"}
|
| 40 |
+
{"current_steps": 380, "total_steps": 480, "loss": 0.4381, "lr": 5e-06, "epoch": 2.3731459797033567, "percentage": 79.17, "elapsed_time": "3:29:06", "remaining_time": "0:55:01"}
|
| 41 |
+
{"current_steps": 390, "total_steps": 480, "loss": 0.4425, "lr": 5e-06, "epoch": 2.4355971896955504, "percentage": 81.25, "elapsed_time": "3:34:23", "remaining_time": "0:49:28"}
|
| 42 |
+
{"current_steps": 400, "total_steps": 480, "loss": 0.4439, "lr": 5e-06, "epoch": 2.498048399687744, "percentage": 83.33, "elapsed_time": "3:39:44", "remaining_time": "0:43:56"}
|
| 43 |
+
{"current_steps": 410, "total_steps": 480, "loss": 0.4434, "lr": 5e-06, "epoch": 2.5604996096799377, "percentage": 85.42, "elapsed_time": "3:45:03", "remaining_time": "0:38:25"}
|
| 44 |
+
{"current_steps": 420, "total_steps": 480, "loss": 0.4376, "lr": 5e-06, "epoch": 2.6229508196721314, "percentage": 87.5, "elapsed_time": "3:50:22", "remaining_time": "0:32:54"}
|
| 45 |
+
{"current_steps": 430, "total_steps": 480, "loss": 0.4418, "lr": 5e-06, "epoch": 2.6854020296643246, "percentage": 89.58, "elapsed_time": "3:55:42", "remaining_time": "0:27:24"}
|
| 46 |
+
{"current_steps": 440, "total_steps": 480, "loss": 0.4489, "lr": 5e-06, "epoch": 2.7478532396565183, "percentage": 91.67, "elapsed_time": "4:00:59", "remaining_time": "0:21:54"}
|
| 47 |
+
{"current_steps": 450, "total_steps": 480, "loss": 0.4446, "lr": 5e-06, "epoch": 2.810304449648712, "percentage": 93.75, "elapsed_time": "4:06:16", "remaining_time": "0:16:25"}
|
| 48 |
+
{"current_steps": 460, "total_steps": 480, "loss": 0.4427, "lr": 5e-06, "epoch": 2.8727556596409056, "percentage": 95.83, "elapsed_time": "4:11:35", "remaining_time": "0:10:56"}
|
| 49 |
+
{"current_steps": 470, "total_steps": 480, "loss": 0.4448, "lr": 5e-06, "epoch": 2.9352068696330993, "percentage": 97.92, "elapsed_time": "4:16:54", "remaining_time": "0:05:27"}
|
| 50 |
+
{"current_steps": 480, "total_steps": 480, "loss": 0.443, "lr": 5e-06, "epoch": 2.9976580796252925, "percentage": 100.0, "elapsed_time": "4:22:12", "remaining_time": "0:00:00"}
|
| 51 |
+
{"current_steps": 480, "total_steps": 480, "eval_loss": 0.5204988121986389, "epoch": 2.9976580796252925, "percentage": 100.0, "elapsed_time": "4:25:17", "remaining_time": "0:00:00"}
|