Training in progress, step 288
Browse files- model-00001-of-00002.safetensors +1 -1
- model-00002-of-00002.safetensors +1 -1
- trainer_log.jsonl +17 -0
model-00001-of-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4969539560
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ad5883a3cee7c47736b45f9790afc68bdd5c731da8985e21a6cb6b18802bee1
|
| 3 |
size 4969539560
|
model-00002-of-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1912795688
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:652f38f7fb6d6d424d146395fc676655eef11c276b4cc3a9e7a2d7d530069500
|
| 3 |
size 1912795688
|
trainer_log.jsonl
CHANGED
|
@@ -781,3 +781,20 @@
|
|
| 781 |
{"current_steps": 287, "total_steps": 400, "loss": 0.6352, "lr": 3.049124342432378e-08, "epoch": 71.87272727272727, "percentage": 71.75, "elapsed_time": "0:34:54", "remaining_time": "0:13:44"}
|
| 782 |
{"current_steps": 288, "total_steps": 400, "loss": 0.6391, "lr": 3.0162835660957385e-08, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:57", "remaining_time": "0:13:35"}
|
| 783 |
{"current_steps": 288, "total_steps": 400, "eval_loss": 0.641921877861023, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:58", "remaining_time": "0:13:36"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 781 |
{"current_steps": 287, "total_steps": 400, "loss": 0.6352, "lr": 3.049124342432378e-08, "epoch": 71.87272727272727, "percentage": 71.75, "elapsed_time": "0:34:54", "remaining_time": "0:13:44"}
|
| 782 |
{"current_steps": 288, "total_steps": 400, "loss": 0.6391, "lr": 3.0162835660957385e-08, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:57", "remaining_time": "0:13:35"}
|
| 783 |
{"current_steps": 288, "total_steps": 400, "eval_loss": 0.641921877861023, "epoch": 72.0, "percentage": 72.0, "elapsed_time": "0:34:58", "remaining_time": "0:13:36"}
|
| 784 |
+
{"current_steps": 289, "total_steps": 400, "loss": 0.6219, "lr": 2.983631934381639e-08, "epoch": 72.2909090909091, "percentage": 72.25, "elapsed_time": "0:35:28", "remaining_time": "0:13:37"}
|
| 785 |
+
{"current_steps": 290, "total_steps": 400, "loss": 0.6635, "lr": 2.9511719338382535e-08, "epoch": 72.58181818181818, "percentage": 72.5, "elapsed_time": "0:35:35", "remaining_time": "0:13:30"}
|
| 786 |
+
{"current_steps": 291, "total_steps": 400, "loss": 0.6377, "lr": 2.918906036420294e-08, "epoch": 72.87272727272727, "percentage": 72.75, "elapsed_time": "0:35:42", "remaining_time": "0:13:22"}
|
| 787 |
+
{"current_steps": 292, "total_steps": 400, "loss": 0.7822, "lr": 2.886836699300771e-08, "epoch": 73.0, "percentage": 73.0, "elapsed_time": "0:35:45", "remaining_time": "0:13:13"}
|
| 788 |
+
{"current_steps": 293, "total_steps": 400, "loss": 0.609, "lr": 2.8549663646838718e-08, "epoch": 73.2909090909091, "percentage": 73.25, "elapsed_time": "0:35:52", "remaining_time": "0:13:06"}
|
| 789 |
+
{"current_steps": 294, "total_steps": 400, "loss": 0.6728, "lr": 2.8232974596189653e-08, "epoch": 73.58181818181818, "percentage": 73.5, "elapsed_time": "0:35:59", "remaining_time": "0:12:58"}
|
| 790 |
+
{"current_steps": 295, "total_steps": 400, "loss": 0.7013, "lr": 2.791832395815782e-08, "epoch": 73.87272727272727, "percentage": 73.75, "elapsed_time": "0:36:06", "remaining_time": "0:12:51"}
|
| 791 |
+
{"current_steps": 296, "total_steps": 400, "loss": 0.6343, "lr": 2.760573569460757e-08, "epoch": 74.0, "percentage": 74.0, "elapsed_time": "0:36:09", "remaining_time": "0:12:42"}
|
| 792 |
+
{"current_steps": 297, "total_steps": 400, "loss": 0.6528, "lr": 2.729523361034538e-08, "epoch": 74.2909090909091, "percentage": 74.25, "elapsed_time": "0:36:16", "remaining_time": "0:12:34"}
|
| 793 |
+
{"current_steps": 298, "total_steps": 400, "loss": 0.6243, "lr": 2.6986841351307128e-08, "epoch": 74.58181818181818, "percentage": 74.5, "elapsed_time": "0:36:23", "remaining_time": "0:12:27"}
|
| 794 |
+
{"current_steps": 299, "total_steps": 400, "loss": 0.6658, "lr": 2.6680582402757322e-08, "epoch": 74.87272727272727, "percentage": 74.75, "elapsed_time": "0:36:30", "remaining_time": "0:12:20"}
|
| 795 |
+
{"current_steps": 300, "total_steps": 400, "loss": 0.7016, "lr": 2.637648008750062e-08, "epoch": 75.0, "percentage": 75.0, "elapsed_time": "0:36:33", "remaining_time": "0:12:11"}
|
| 796 |
+
{"current_steps": 301, "total_steps": 400, "loss": 0.6661, "lr": 2.6074557564105726e-08, "epoch": 75.2909090909091, "percentage": 75.25, "elapsed_time": "0:36:40", "remaining_time": "0:12:03"}
|
| 797 |
+
{"current_steps": 302, "total_steps": 400, "loss": 0.6277, "lr": 2.5774837825141737e-08, "epoch": 75.58181818181818, "percentage": 75.5, "elapsed_time": "0:36:48", "remaining_time": "0:11:56"}
|
| 798 |
+
{"current_steps": 303, "total_steps": 400, "loss": 0.6863, "lr": 2.547734369542718e-08, "epoch": 75.87272727272727, "percentage": 75.75, "elapsed_time": "0:36:54", "remaining_time": "0:11:49"}
|
| 799 |
+
{"current_steps": 304, "total_steps": 400, "loss": 0.648, "lr": 2.5182097830291825e-08, "epoch": 76.0, "percentage": 76.0, "elapsed_time": "0:36:58", "remaining_time": "0:11:40"}
|
| 800 |
+
{"current_steps": 304, "total_steps": 400, "eval_loss": 0.6407743096351624, "epoch": 76.0, "percentage": 76.0, "elapsed_time": "0:36:58", "remaining_time": "0:11:40"}
|