Training in progress, epoch 1

Files changed (5) hide show

model-00001-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e8c1201bc149695d453824fad8f0107997f14e87075bf064fec51fa4b22005ab
 size 4976698672

 version https://git-lfs.github.com/spec/v1
+oid sha256:554244aec94ede1891c5897e8d55405ef0f2b242dcdd03f8a07024370aded9b5
 size 4976698672

model-00002-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:987629a6fdc6569fd0ec875b3f4706c4f99464ce1b4af7886f9d20c4cd766559
 size 4999802720

 version https://git-lfs.github.com/spec/v1
+oid sha256:89b60273e59ccbbde7feee830b59d8f891e32439b261f4448b6ff13b0a9d3a8c
 size 4999802720

model-00003-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:39f250e395da7a92b605742d55699b679ed43ce6f08705f379813f0b970e198d
 size 4915916176

 version https://git-lfs.github.com/spec/v1
+oid sha256:7750bc12cd1cceccc1a830075e2fe088f4c73614d11b60a76cf28833be552823
 size 4915916176

model-00004-of-00004.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b39bed45569e21fc66509b0fcd4fae907deccd8eb5d2e5e15ee6b4d9df92266a
 size 1168138808

 version https://git-lfs.github.com/spec/v1
+oid sha256:1e238d204f725fb028400a531a16690e989becb5c29fff3f4821303047fbc5d4
 size 1168138808

trainer_log.jsonl CHANGED Viewed

@@ -2,3 +2,7 @@
 {"current_steps": 20, "total_steps": 102, "loss": 0.7615, "lr": 5e-06, "epoch": 0.5871559633027523, "percentage": 19.61, "elapsed_time": "0:53:06", "remaining_time": "3:37:45"}
 {"current_steps": 30, "total_steps": 102, "loss": 0.7229, "lr": 5e-06, "epoch": 0.8807339449541285, "percentage": 29.41, "elapsed_time": "1:19:24", "remaining_time": "3:10:34"}
 {"current_steps": 34, "total_steps": 102, "eval_loss": 0.6932151913642883, "epoch": 0.998165137614679, "percentage": 33.33, "elapsed_time": "1:31:54", "remaining_time": "3:03:49"}

 {"current_steps": 20, "total_steps": 102, "loss": 0.7615, "lr": 5e-06, "epoch": 0.5871559633027523, "percentage": 19.61, "elapsed_time": "0:53:06", "remaining_time": "3:37:45"}
 {"current_steps": 30, "total_steps": 102, "loss": 0.7229, "lr": 5e-06, "epoch": 0.8807339449541285, "percentage": 29.41, "elapsed_time": "1:19:24", "remaining_time": "3:10:34"}
 {"current_steps": 34, "total_steps": 102, "eval_loss": 0.6932151913642883, "epoch": 0.998165137614679, "percentage": 33.33, "elapsed_time": "1:31:54", "remaining_time": "3:03:49"}
+{"current_steps": 40, "total_steps": 102, "loss": 0.684, "lr": 5e-06, "epoch": 1.1743119266055047, "percentage": 39.22, "elapsed_time": "1:48:54", "remaining_time": "2:48:47"}
+{"current_steps": 50, "total_steps": 102, "loss": 0.6549, "lr": 5e-06, "epoch": 1.4678899082568808, "percentage": 49.02, "elapsed_time": "2:15:00", "remaining_time": "2:20:24"}
+{"current_steps": 60, "total_steps": 102, "loss": 0.6412, "lr": 5e-06, "epoch": 1.761467889908257, "percentage": 58.82, "elapsed_time": "2:41:06", "remaining_time": "1:52:46"}
+{"current_steps": 68, "total_steps": 102, "eval_loss": 0.6560695171356201, "epoch": 1.996330275229358, "percentage": 66.67, "elapsed_time": "3:04:05", "remaining_time": "1:32:02"}