Training in progress, step 3400
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4902257696
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc993fdd01a09b520ec832fb24610d1ce0e2842b765077f2674334bc6bfe18c8
|
| 3 |
size 4902257696
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915960368
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b1a1fe155a80d2ef486cc1906a123f619c30f1896659ae85741c33b3d0b598ce
|
| 3 |
size 4915960368
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4983068496
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db48171ec06151fb4191ac2ecb6c537dbe0c9b4341e3d83f83a53af8304c17eb
|
| 3 |
size 4983068496
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1580230264
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7524fe06622c2ee77bab3c857718f6f3c14a72610b5db2f3cb64be410c7d7c2f
|
| 3 |
size 1580230264
|
trainer_log.jsonl
CHANGED
|
@@ -668,3 +668,15 @@
|
|
| 668 |
{"current_steps": 3330, "total_steps": 6188, "loss": 0.0882, "lr": 2.0840293624721234e-05, "epoch": 3.767402376910017, "percentage": 53.81, "elapsed_time": "2:02:49", "remaining_time": "1:45:24"}
|
| 669 |
{"current_steps": 3335, "total_steps": 6188, "loss": 0.0833, "lr": 2.0783928018781644e-05, "epoch": 3.77306168647425, "percentage": 53.89, "elapsed_time": "2:04:25", "remaining_time": "1:46:26"}
|
| 670 |
{"current_steps": 3340, "total_steps": 6188, "loss": 0.0882, "lr": 2.0727556176050676e-05, "epoch": 3.7787209960384835, "percentage": 53.98, "elapsed_time": "2:06:00", "remaining_time": "1:47:26"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 668 |
{"current_steps": 3330, "total_steps": 6188, "loss": 0.0882, "lr": 2.0840293624721234e-05, "epoch": 3.767402376910017, "percentage": 53.81, "elapsed_time": "2:02:49", "remaining_time": "1:45:24"}
|
| 669 |
{"current_steps": 3335, "total_steps": 6188, "loss": 0.0833, "lr": 2.0783928018781644e-05, "epoch": 3.77306168647425, "percentage": 53.89, "elapsed_time": "2:04:25", "remaining_time": "1:46:26"}
|
| 670 |
{"current_steps": 3340, "total_steps": 6188, "loss": 0.0882, "lr": 2.0727556176050676e-05, "epoch": 3.7787209960384835, "percentage": 53.98, "elapsed_time": "2:06:00", "remaining_time": "1:47:26"}
|
| 671 |
+
{"current_steps": 3345, "total_steps": 6188, "loss": 0.0945, "lr": 2.0671178545012643e-05, "epoch": 3.7843803056027165, "percentage": 54.06, "elapsed_time": "2:07:36", "remaining_time": "1:48:27"}
|
| 672 |
+
{"current_steps": 3350, "total_steps": 6188, "loss": 0.101, "lr": 2.0614795574197907e-05, "epoch": 3.7900396151669495, "percentage": 54.14, "elapsed_time": "2:09:25", "remaining_time": "1:49:38"}
|
| 673 |
+
{"current_steps": 3355, "total_steps": 6188, "loss": 0.0925, "lr": 2.0558407712179334e-05, "epoch": 3.795698924731183, "percentage": 54.22, "elapsed_time": "2:11:01", "remaining_time": "1:50:38"}
|
| 674 |
+
{"current_steps": 3360, "total_steps": 6188, "loss": 0.1026, "lr": 2.050201540756868e-05, "epoch": 3.801358234295416, "percentage": 54.3, "elapsed_time": "2:12:30", "remaining_time": "1:51:31"}
|
| 675 |
+
{"current_steps": 3365, "total_steps": 6188, "loss": 0.1105, "lr": 2.0445619109013054e-05, "epoch": 3.807017543859649, "percentage": 54.38, "elapsed_time": "2:14:33", "remaining_time": "1:52:52"}
|
| 676 |
+
{"current_steps": 3370, "total_steps": 6188, "loss": 0.0871, "lr": 2.038921926519134e-05, "epoch": 3.8126768534238824, "percentage": 54.46, "elapsed_time": "2:16:08", "remaining_time": "1:53:50"}
|
| 677 |
+
{"current_steps": 3375, "total_steps": 6188, "loss": 0.0755, "lr": 2.033281632481063e-05, "epoch": 3.8183361629881154, "percentage": 54.54, "elapsed_time": "2:17:41", "remaining_time": "1:54:45"}
|
| 678 |
+
{"current_steps": 3380, "total_steps": 6188, "loss": 0.0889, "lr": 2.027641073660265e-05, "epoch": 3.8239954725523484, "percentage": 54.62, "elapsed_time": "2:19:12", "remaining_time": "1:55:39"}
|
| 679 |
+
{"current_steps": 3385, "total_steps": 6188, "loss": 0.1151, "lr": 2.0220002949320187e-05, "epoch": 3.829654782116582, "percentage": 54.7, "elapsed_time": "2:21:16", "remaining_time": "1:56:59"}
|
| 680 |
+
{"current_steps": 3390, "total_steps": 6188, "loss": 0.0715, "lr": 2.0163593411733533e-05, "epoch": 3.835314091680815, "percentage": 54.78, "elapsed_time": "2:22:46", "remaining_time": "1:57:50"}
|
| 681 |
+
{"current_steps": 3395, "total_steps": 6188, "loss": 0.0893, "lr": 2.0107182572626897e-05, "epoch": 3.8409734012450483, "percentage": 54.86, "elapsed_time": "2:24:48", "remaining_time": "1:59:08"}
|
| 682 |
+
{"current_steps": 3400, "total_steps": 6188, "loss": 0.0863, "lr": 2.0050770880794843e-05, "epoch": 3.8466327108092813, "percentage": 54.95, "elapsed_time": "2:26:30", "remaining_time": "2:00:07"}
|