Training in progress, epoch 1
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4eaae1741a1d0234c89719a2643feadbc868e24f09b0c31241c0d57ac7aebbbe
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:537c0ba8796466458d7b994096971d4603aac003b0788ba9d8c5cfddf73bdf57
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:90b827c366e55055ef35cd22b7289e353919f343bc7d35ed07277fb956750a81
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a9ab0769c89106d4b7b4bb69507b68aa558166bed24b174ff6b2e07f33b4f399
|
| 3 |
size 1168138808
|
trainer_log.jsonl
CHANGED
|
@@ -2,3 +2,7 @@
|
|
| 2 |
{"current_steps": 20, "total_steps": 87, "loss": 1.1183, "lr": 5e-06, "epoch": 0.6866952789699571, "percentage": 22.99, "elapsed_time": "0:19:12", "remaining_time": "1:04:20"}
|
| 3 |
{"current_steps": 29, "total_steps": 87, "eval_loss": 1.0753060579299927, "epoch": 0.9957081545064378, "percentage": 33.33, "elapsed_time": "0:28:29", "remaining_time": "0:56:58"}
|
| 4 |
{"current_steps": 30, "total_steps": 87, "loss": 1.1737, "lr": 5e-06, "epoch": 1.0300429184549356, "percentage": 34.48, "elapsed_time": "0:30:27", "remaining_time": "0:57:51"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 2 |
{"current_steps": 20, "total_steps": 87, "loss": 1.1183, "lr": 5e-06, "epoch": 0.6866952789699571, "percentage": 22.99, "elapsed_time": "0:19:12", "remaining_time": "1:04:20"}
|
| 3 |
{"current_steps": 29, "total_steps": 87, "eval_loss": 1.0753060579299927, "epoch": 0.9957081545064378, "percentage": 33.33, "elapsed_time": "0:28:29", "remaining_time": "0:56:58"}
|
| 4 |
{"current_steps": 30, "total_steps": 87, "loss": 1.1737, "lr": 5e-06, "epoch": 1.0300429184549356, "percentage": 34.48, "elapsed_time": "0:30:27", "remaining_time": "0:57:51"}
|
| 5 |
+
{"current_steps": 40, "total_steps": 87, "loss": 1.0339, "lr": 5e-06, "epoch": 1.3733905579399142, "percentage": 45.98, "elapsed_time": "0:40:03", "remaining_time": "0:47:03"}
|
| 6 |
+
{"current_steps": 50, "total_steps": 87, "loss": 1.0128, "lr": 5e-06, "epoch": 1.7167381974248928, "percentage": 57.47, "elapsed_time": "0:49:39", "remaining_time": "0:36:44"}
|
| 7 |
+
{"current_steps": 58, "total_steps": 87, "eval_loss": 1.036221981048584, "epoch": 1.9914163090128756, "percentage": 66.67, "elapsed_time": "0:58:04", "remaining_time": "0:29:02"}
|
| 8 |
+
{"current_steps": 60, "total_steps": 87, "loss": 1.0832, "lr": 5e-06, "epoch": 2.060085836909871, "percentage": 68.97, "elapsed_time": "1:00:57", "remaining_time": "0:27:25"}
|