Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4877660776
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ec76302756ab030af205239263a8cd486aecd80fee59c1e5820568260e18167
|
| 3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4932751008
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:485e6839dd50bc05c65204666e555d88287e2e58ba354d5c244ab9143a4726a2
|
| 3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4330865200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:338361d832951c14cba6203e4b19cd32b4231be25e5be19796a024f391cf9522
|
| 3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1089994880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:adf8c9004d4804af450f145b84d4405a54ce4ee3aa1c83569bb0622bb38f2412
|
| 3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
|
@@ -22,3 +22,10 @@
|
|
| 22 |
{"current_steps": 22, "total_steps": 30, "loss": 0.5769, "lr": 2.0142070414860704e-06, "epoch": 2.112, "percentage": 73.33, "elapsed_time": "0:21:42", "remaining_time": "0:07:53"}
|
| 23 |
{"current_steps": 23, "total_steps": 30, "loss": 0.5528, "lr": 1.5687918106563326e-06, "epoch": 2.208, "percentage": 76.67, "elapsed_time": "0:22:39", "remaining_time": "0:06:53"}
|
| 24 |
{"current_steps": 24, "total_steps": 30, "loss": 0.6085, "lr": 1.1697777844051105e-06, "epoch": 2.304, "percentage": 80.0, "elapsed_time": "0:23:29", "remaining_time": "0:05:52"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 22 |
{"current_steps": 22, "total_steps": 30, "loss": 0.5769, "lr": 2.0142070414860704e-06, "epoch": 2.112, "percentage": 73.33, "elapsed_time": "0:21:42", "remaining_time": "0:07:53"}
|
| 23 |
{"current_steps": 23, "total_steps": 30, "loss": 0.5528, "lr": 1.5687918106563326e-06, "epoch": 2.208, "percentage": 76.67, "elapsed_time": "0:22:39", "remaining_time": "0:06:53"}
|
| 24 |
{"current_steps": 24, "total_steps": 30, "loss": 0.6085, "lr": 1.1697777844051105e-06, "epoch": 2.304, "percentage": 80.0, "elapsed_time": "0:23:29", "remaining_time": "0:05:52"}
|
| 25 |
+
{"current_steps": 25, "total_steps": 30, "loss": 0.5401, "lr": 8.225609429353187e-07, "epoch": 2.4, "percentage": 83.33, "elapsed_time": "0:24:19", "remaining_time": "0:04:51"}
|
| 26 |
+
{"current_steps": 26, "total_steps": 30, "loss": 0.5971, "lr": 5.318367983829393e-07, "epoch": 2.496, "percentage": 86.67, "elapsed_time": "0:25:17", "remaining_time": "0:03:53"}
|
| 27 |
+
{"current_steps": 27, "total_steps": 30, "loss": 0.613, "lr": 3.015368960704584e-07, "epoch": 2.592, "percentage": 90.0, "elapsed_time": "0:26:05", "remaining_time": "0:02:53"}
|
| 28 |
+
{"current_steps": 28, "total_steps": 30, "loss": 0.5625, "lr": 1.3477564710088097e-07, "epoch": 2.6879999999999997, "percentage": 93.33, "elapsed_time": "0:27:06", "remaining_time": "0:01:56"}
|
| 29 |
+
{"current_steps": 29, "total_steps": 30, "loss": 0.539, "lr": 3.3808211290284886e-08, "epoch": 2.784, "percentage": 96.67, "elapsed_time": "0:28:03", "remaining_time": "0:00:58"}
|
| 30 |
+
{"current_steps": 30, "total_steps": 30, "loss": 0.5994, "lr": 0.0, "epoch": 2.88, "percentage": 100.0, "elapsed_time": "0:28:51", "remaining_time": "0:00:00"}
|
| 31 |
+
{"current_steps": 30, "total_steps": 30, "epoch": 2.88, "percentage": 100.0, "elapsed_time": "0:31:03", "remaining_time": "0:00:00"}
|