Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:eaa517f491c3d3da314d6fc8d569d38e3531440f688007adfff23ac120c6e26f
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:808dbe047d95738e1041d49f750773e21c25337195873976f1d9c5f26c7c8bce
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:52ac9fea3dbb07440bc7f612eb89ad63ab225f4ab97fbf07f392e645e10d3ba7
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da17dea92315d0547f945f1eaed4720041584a3fa4f1f86df3564806a241732b
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -24,3 +24,8 @@
|
|
| 24 |
{"current_steps": 24, "total_steps": 30, "loss": 0.7032, "lr": 1.1697777844051105e-06, "epoch": 2.3125, "percentage": 80.0, "elapsed_time": "0:12:35", "remaining_time": "0:03:08"}
|
| 25 |
{"current_steps": 25, "total_steps": 30, "loss": 0.6561, "lr": 8.225609429353187e-07, "epoch": 2.40625, "percentage": 83.33, "elapsed_time": "0:13:07", "remaining_time": "0:02:37"}
|
| 26 |
{"current_steps": 26, "total_steps": 30, "loss": 0.6628, "lr": 5.318367983829393e-07, "epoch": 2.5, "percentage": 86.67, "elapsed_time": "0:13:30", "remaining_time": "0:02:04"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 24 |
{"current_steps": 24, "total_steps": 30, "loss": 0.7032, "lr": 1.1697777844051105e-06, "epoch": 2.3125, "percentage": 80.0, "elapsed_time": "0:12:35", "remaining_time": "0:03:08"}
|
| 25 |
{"current_steps": 25, "total_steps": 30, "loss": 0.6561, "lr": 8.225609429353187e-07, "epoch": 2.40625, "percentage": 83.33, "elapsed_time": "0:13:07", "remaining_time": "0:02:37"}
|
| 26 |
{"current_steps": 26, "total_steps": 30, "loss": 0.6628, "lr": 5.318367983829393e-07, "epoch": 2.5, "percentage": 86.67, "elapsed_time": "0:13:30", "remaining_time": "0:02:04"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 30, "loss": 0.7113, "lr": 3.015368960704584e-07, "epoch": 2.59375, "percentage": 90.0, "elapsed_time": "0:13:57", "remaining_time": "0:01:33"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 30, "loss": 0.6845, "lr": 1.3477564710088097e-07, "epoch": 2.6875, "percentage": 93.33, "elapsed_time": "0:14:29", "remaining_time": "0:01:02"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 30, "loss": 0.6777, "lr": 3.3808211290284886e-08, "epoch": 2.78125, "percentage": 96.67, "elapsed_time": "0:15:01", "remaining_time": "0:00:31"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 30, "loss": 0.6966, "lr": 0.0, "epoch": 2.875, "percentage": 100.0, "elapsed_time": "0:15:28", "remaining_time": "0:00:00"}
|
| 31 |
+
{"current_steps": 30, "total_steps": 30, "epoch": 2.875, "percentage": 100.0, "elapsed_time": "0:16:56", "remaining_time": "0:00:00"}
|