Training in progress, epoch 2

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc13626b142a066c6768de5d75e7ac643d2286bc9f9c3f39b29777c47c5adc0a
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:f19856a1e8c1b5d59c228fa083db4efbae8a697ddae9459cb4be66e2eb8a4db6
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:84740073de871bfee3508f3717f1d8562cf8fc5df3f2eea750def81595d51c88
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:2cbab3c2438931f42949da3f3d7c46971991fec6cf53d0c7d433927cb1d9a77e
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f5b22378f9928194214456164606dd4f6f16bffbe343a2ca3d01d438b2409357
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:8d8e732c9070365f668a83e45569ed681cc0f21fc2041e808998874ee654e917
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:98abc91bf3e78bc9166bac8ebbdf730300ce6993fa0a202497f099cbd41f3b15
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:e3d5e3c00a34ab4a8c61c2ba9a39b101ab6a2a97ce8d3275427bc750b0f38463
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -2,3 +2,8 @@
 {"current_steps": 20, "total_steps": 105, "loss": 0.8918, "lr": 5e-06, "epoch": 0.5714285714285714, "percentage": 19.05, "elapsed_time": "0:51:48", "remaining_time": "3:40:09"}
 {"current_steps": 30, "total_steps": 105, "loss": 0.853, "lr": 5e-06, "epoch": 0.8571428571428571, "percentage": 28.57, "elapsed_time": "1:17:39", "remaining_time": "3:14:09"}
 {"current_steps": 35, "total_steps": 105, "eval_loss": 0.8312212824821472, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "1:32:23", "remaining_time": "3:04:46"}

 {"current_steps": 20, "total_steps": 105, "loss": 0.8918, "lr": 5e-06, "epoch": 0.5714285714285714, "percentage": 19.05, "elapsed_time": "0:51:48", "remaining_time": "3:40:09"}
 {"current_steps": 30, "total_steps": 105, "loss": 0.853, "lr": 5e-06, "epoch": 0.8571428571428571, "percentage": 28.57, "elapsed_time": "1:17:39", "remaining_time": "3:14:09"}
 {"current_steps": 35, "total_steps": 105, "eval_loss": 0.8312212824821472, "epoch": 1.0, "percentage": 33.33, "elapsed_time": "1:32:23", "remaining_time": "3:04:46"}
+{"current_steps": 40, "total_steps": 105, "loss": 0.8164, "lr": 5e-06, "epoch": 1.1428571428571428, "percentage": 38.1, "elapsed_time": "1:46:40", "remaining_time": "2:53:21"}
+{"current_steps": 50, "total_steps": 105, "loss": 0.7836, "lr": 5e-06, "epoch": 1.4285714285714286, "percentage": 47.62, "elapsed_time": "2:12:31", "remaining_time": "2:25:46"}
+{"current_steps": 60, "total_steps": 105, "loss": 0.7806, "lr": 5e-06, "epoch": 1.7142857142857144, "percentage": 57.14, "elapsed_time": "2:38:22", "remaining_time": "1:58:46"}
+{"current_steps": 70, "total_steps": 105, "loss": 0.7709, "lr": 5e-06, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:04:13", "remaining_time": "1:32:06"}
+{"current_steps": 70, "total_steps": 105, "eval_loss": 0.8022096753120422, "epoch": 2.0, "percentage": 66.67, "elapsed_time": "3:06:02", "remaining_time": "1:33:01"}