Training in progress, step 368
Browse files- model-00001-of-00002.safetensors +1 -1
- model-00002-of-00002.safetensors +1 -1
- trainer_log.jsonl +17 -0
model-00001-of-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4969539560
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9ceb02694688565e3a16da06ce91c5e882db4d780d31df5f10c2dea997b2c3ca
|
| 3 |
size 4969539560
|
model-00002-of-00002.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1912795688
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6db59088a0fb0851b5830cd0eb2bea70eda5332580952aa7bc75acee5ac2887e
|
| 3 |
size 1912795688
|
trainer_log.jsonl
CHANGED
|
@@ -866,3 +866,20 @@
|
|
| 866 |
{"current_steps": 367, "total_steps": 400, "loss": 0.6327, "lr": 1.1966285981663406e-08, "epoch": 91.87272727272727, "percentage": 91.75, "elapsed_time": "0:44:39", "remaining_time": "0:04:00"}
|
| 867 |
{"current_steps": 368, "total_steps": 400, "loss": 0.6545, "lr": 1.1853111930931313e-08, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:42", "remaining_time": "0:03:53"}
|
| 868 |
{"current_steps": 368, "total_steps": 400, "eval_loss": 0.6371535062789917, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:43", "remaining_time": "0:03:53"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 866 |
{"current_steps": 367, "total_steps": 400, "loss": 0.6327, "lr": 1.1966285981663406e-08, "epoch": 91.87272727272727, "percentage": 91.75, "elapsed_time": "0:44:39", "remaining_time": "0:04:00"}
|
| 867 |
{"current_steps": 368, "total_steps": 400, "loss": 0.6545, "lr": 1.1853111930931313e-08, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:42", "remaining_time": "0:03:53"}
|
| 868 |
{"current_steps": 368, "total_steps": 400, "eval_loss": 0.6371535062789917, "epoch": 92.0, "percentage": 92.0, "elapsed_time": "0:44:43", "remaining_time": "0:03:53"}
|
| 869 |
+
{"current_steps": 369, "total_steps": 400, "loss": 0.5913, "lr": 1.174322368277565e-08, "epoch": 92.2909090909091, "percentage": 92.25, "elapsed_time": "0:45:15", "remaining_time": "0:03:48"}
|
| 870 |
+
{"current_steps": 370, "total_steps": 400, "loss": 0.6869, "lr": 1.1636629605611967e-08, "epoch": 92.58181818181818, "percentage": 92.5, "elapsed_time": "0:45:22", "remaining_time": "0:03:40"}
|
| 871 |
+
{"current_steps": 371, "total_steps": 400, "loss": 0.6699, "lr": 1.1533337816991931e-08, "epoch": 92.87272727272727, "percentage": 92.75, "elapsed_time": "0:45:29", "remaining_time": "0:03:33"}
|
| 872 |
+
{"current_steps": 372, "total_steps": 400, "loss": 0.658, "lr": 1.1433356182985158e-08, "epoch": 93.0, "percentage": 93.0, "elapsed_time": "0:45:32", "remaining_time": "0:03:25"}
|
| 873 |
+
{"current_steps": 373, "total_steps": 400, "loss": 0.7064, "lr": 1.133669231758016e-08, "epoch": 93.2909090909091, "percentage": 93.25, "elapsed_time": "0:45:40", "remaining_time": "0:03:18"}
|
| 874 |
+
{"current_steps": 374, "total_steps": 400, "loss": 0.6268, "lr": 1.1243353582104555e-08, "epoch": 93.58181818181818, "percentage": 93.5, "elapsed_time": "0:45:46", "remaining_time": "0:03:10"}
|
| 875 |
+
{"current_steps": 375, "total_steps": 400, "loss": 0.6366, "lr": 1.115334708466442e-08, "epoch": 93.87272727272727, "percentage": 93.75, "elapsed_time": "0:45:53", "remaining_time": "0:03:03"}
|
| 876 |
+
{"current_steps": 376, "total_steps": 400, "loss": 0.5847, "lr": 1.1066679679602998e-08, "epoch": 94.0, "percentage": 94.0, "elapsed_time": "0:45:56", "remaining_time": "0:02:55"}
|
| 877 |
+
{"current_steps": 377, "total_steps": 400, "loss": 0.6578, "lr": 1.0983357966978745e-08, "epoch": 94.2909090909091, "percentage": 94.25, "elapsed_time": "0:46:03", "remaining_time": "0:02:48"}
|
| 878 |
+
{"current_steps": 378, "total_steps": 400, "loss": 0.6523, "lr": 1.0903388292062667e-08, "epoch": 94.58181818181818, "percentage": 94.5, "elapsed_time": "0:46:10", "remaining_time": "0:02:41"}
|
| 879 |
+
{"current_steps": 379, "total_steps": 400, "loss": 0.6582, "lr": 1.0826776744855121e-08, "epoch": 94.87272727272727, "percentage": 94.75, "elapsed_time": "0:46:17", "remaining_time": "0:02:33"}
|
| 880 |
+
{"current_steps": 380, "total_steps": 400, "loss": 0.6047, "lr": 1.0753529159622047e-08, "epoch": 95.0, "percentage": 95.0, "elapsed_time": "0:46:20", "remaining_time": "0:02:26"}
|
| 881 |
+
{"current_steps": 381, "total_steps": 400, "loss": 0.6078, "lr": 1.068365111445064e-08, "epoch": 95.2909090909091, "percentage": 95.25, "elapsed_time": "0:46:26", "remaining_time": "0:02:18"}
|
| 882 |
+
{"current_steps": 382, "total_steps": 400, "loss": 0.6347, "lr": 1.0617147930824585e-08, "epoch": 95.58181818181818, "percentage": 95.5, "elapsed_time": "0:46:34", "remaining_time": "0:02:11"}
|
| 883 |
+
{"current_steps": 383, "total_steps": 400, "loss": 0.6709, "lr": 1.0554024673218806e-08, "epoch": 95.87272727272727, "percentage": 95.75, "elapsed_time": "0:46:40", "remaining_time": "0:02:04"}
|
| 884 |
+
{"current_steps": 384, "total_steps": 400, "loss": 0.7126, "lr": 1.0494286148713743e-08, "epoch": 96.0, "percentage": 96.0, "elapsed_time": "0:46:43", "remaining_time": "0:01:56"}
|
| 885 |
+
{"current_steps": 384, "total_steps": 400, "eval_loss": 0.6363654732704163, "epoch": 96.0, "percentage": 96.0, "elapsed_time": "0:46:44", "remaining_time": "0:01:56"}
|