Training in progress, epoch 2

Browse files

Files changed (5) hide show

model-00001-of-00004.safetensors +1 -1
model-00002-of-00004.safetensors +1 -1
model-00003-of-00004.safetensors +1 -1
model-00004-of-00004.safetensors +1 -1
trainer_log.jsonl +17 -0

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e647bc20fd433b24625114790f9e69e8bb45a8717aac313a9cee2e1f4b5deec4
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:3a6e779afcc3dd063450f41d163042ee61c114fd52ebf27ed4dce854416c4dc4
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f5d20921fbfeecee24dd4eb1350f3f5bdebad235fc88a8c528a158f70a305d92
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:965bd6a3e77b7215f64703a397579790961052df0dfb4a4e11121bf4c431da4a
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dfc780e8a17ce70fe0e5ff8003728d506ccb762623c502fc735ef1567c2323ee
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:a3c7eb8cbc926b31d653770c13b396d7a46f151a6b00dcc5c3d682f9ecf5716b
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d85f009124922b03455f6750bfa74a5fd707b5d0db66457a02e7b1f802a31ed5
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:e1edd53054da16982db7b30edf97e505684b42ad6bf577709c5e18d22022c54c
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -32,3 +32,20 @@
 {"current_steps": 310, "total_steps": 480, "loss": 0.4789, "lr": 5e-06, "epoch": 1.9359875097580015, "percentage": 64.58, "elapsed_time": "2:48:44", "remaining_time": "1:32:31"}
 {"current_steps": 320, "total_steps": 480, "loss": 0.4787, "lr": 5e-06, "epoch": 1.9984387197501952, "percentage": 66.67, "elapsed_time": "2:54:06", "remaining_time": "1:27:03"}
 {"current_steps": 320, "total_steps": 480, "eval_loss": 0.5198609828948975, "epoch": 1.9984387197501952, "percentage": 66.67, "elapsed_time": "2:56:03", "remaining_time": "1:28:01"}

 {"current_steps": 310, "total_steps": 480, "loss": 0.4789, "lr": 5e-06, "epoch": 1.9359875097580015, "percentage": 64.58, "elapsed_time": "2:48:44", "remaining_time": "1:32:31"}
 {"current_steps": 320, "total_steps": 480, "loss": 0.4787, "lr": 5e-06, "epoch": 1.9984387197501952, "percentage": 66.67, "elapsed_time": "2:54:06", "remaining_time": "1:27:03"}
 {"current_steps": 320, "total_steps": 480, "eval_loss": 0.5198609828948975, "epoch": 1.9984387197501952, "percentage": 66.67, "elapsed_time": "2:56:03", "remaining_time": "1:28:01"}
+{"current_steps": 330, "total_steps": 480, "loss": 0.4873, "lr": 5e-06, "epoch": 2.060889929742389, "percentage": 68.75, "elapsed_time": "3:02:31", "remaining_time": "1:22:58"}
+{"current_steps": 340, "total_steps": 480, "loss": 0.4362, "lr": 5e-06, "epoch": 2.1233411397345825, "percentage": 70.83, "elapsed_time": "3:07:49", "remaining_time": "1:17:20"}
+{"current_steps": 350, "total_steps": 480, "loss": 0.4425, "lr": 5e-06, "epoch": 2.185792349726776, "percentage": 72.92, "elapsed_time": "3:13:09", "remaining_time": "1:11:44"}
+{"current_steps": 360, "total_steps": 480, "loss": 0.4355, "lr": 5e-06, "epoch": 2.2482435597189694, "percentage": 75.0, "elapsed_time": "3:18:30", "remaining_time": "1:06:10"}
+{"current_steps": 370, "total_steps": 480, "loss": 0.4384, "lr": 5e-06, "epoch": 2.310694769711163, "percentage": 77.08, "elapsed_time": "3:23:49", "remaining_time": "1:00:35"}
+{"current_steps": 380, "total_steps": 480, "loss": 0.4381, "lr": 5e-06, "epoch": 2.3731459797033567, "percentage": 79.17, "elapsed_time": "3:29:06", "remaining_time": "0:55:01"}
+{"current_steps": 390, "total_steps": 480, "loss": 0.4425, "lr": 5e-06, "epoch": 2.4355971896955504, "percentage": 81.25, "elapsed_time": "3:34:23", "remaining_time": "0:49:28"}
+{"current_steps": 400, "total_steps": 480, "loss": 0.4439, "lr": 5e-06, "epoch": 2.498048399687744, "percentage": 83.33, "elapsed_time": "3:39:44", "remaining_time": "0:43:56"}
+{"current_steps": 410, "total_steps": 480, "loss": 0.4434, "lr": 5e-06, "epoch": 2.5604996096799377, "percentage": 85.42, "elapsed_time": "3:45:03", "remaining_time": "0:38:25"}
+{"current_steps": 420, "total_steps": 480, "loss": 0.4376, "lr": 5e-06, "epoch": 2.6229508196721314, "percentage": 87.5, "elapsed_time": "3:50:22", "remaining_time": "0:32:54"}
+{"current_steps": 430, "total_steps": 480, "loss": 0.4418, "lr": 5e-06, "epoch": 2.6854020296643246, "percentage": 89.58, "elapsed_time": "3:55:42", "remaining_time": "0:27:24"}
+{"current_steps": 440, "total_steps": 480, "loss": 0.4489, "lr": 5e-06, "epoch": 2.7478532396565183, "percentage": 91.67, "elapsed_time": "4:00:59", "remaining_time": "0:21:54"}
+{"current_steps": 450, "total_steps": 480, "loss": 0.4446, "lr": 5e-06, "epoch": 2.810304449648712, "percentage": 93.75, "elapsed_time": "4:06:16", "remaining_time": "0:16:25"}
+{"current_steps": 460, "total_steps": 480, "loss": 0.4427, "lr": 5e-06, "epoch": 2.8727556596409056, "percentage": 95.83, "elapsed_time": "4:11:35", "remaining_time": "0:10:56"}
+{"current_steps": 470, "total_steps": 480, "loss": 0.4448, "lr": 5e-06, "epoch": 2.9352068696330993, "percentage": 97.92, "elapsed_time": "4:16:54", "remaining_time": "0:05:27"}
+{"current_steps": 480, "total_steps": 480, "loss": 0.443, "lr": 5e-06, "epoch": 2.9976580796252925, "percentage": 100.0, "elapsed_time": "4:22:12", "remaining_time": "0:00:00"}
+{"current_steps": 480, "total_steps": 480, "eval_loss": 0.5204988121986389, "epoch": 2.9976580796252925, "percentage": 100.0, "elapsed_time": "4:25:17", "remaining_time": "0:00:00"}