Training in progress, step 400
Browse files- model.safetensors +1 -1
- trainer_log.jsonl +10 -0
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3554214752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fdbe330afff3ae1b094b65a537cb426c1c30fc7a4bf77a48c0987b5de61ca37e
|
| 3 |
size 3554214752
|
trainer_log.jsonl
CHANGED
|
@@ -28,3 +28,13 @@
|
|
| 28 |
{"current_steps": 280, "total_steps": 1931, "loss": 0.0292, "lr": 1.988206235503821e-05, "epoch": 0.14504014504014504, "percentage": 14.5, "elapsed_time": "4:27:23", "remaining_time": "1 day, 2:16:37"}
|
| 29 |
{"current_steps": 290, "total_steps": 1931, "loss": 0.0291, "lr": 1.98527522661065e-05, "epoch": 0.15022015022015023, "percentage": 15.02, "elapsed_time": "4:36:56", "remaining_time": "1 day, 2:07:05"}
|
| 30 |
{"current_steps": 300, "total_steps": 1931, "loss": 0.0284, "lr": 1.9820219284577052e-05, "epoch": 0.1554001554001554, "percentage": 15.54, "elapsed_time": "4:46:29", "remaining_time": "1 day, 1:57:32"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 28 |
{"current_steps": 280, "total_steps": 1931, "loss": 0.0292, "lr": 1.988206235503821e-05, "epoch": 0.14504014504014504, "percentage": 14.5, "elapsed_time": "4:27:23", "remaining_time": "1 day, 2:16:37"}
|
| 29 |
{"current_steps": 290, "total_steps": 1931, "loss": 0.0291, "lr": 1.98527522661065e-05, "epoch": 0.15022015022015023, "percentage": 15.02, "elapsed_time": "4:36:56", "remaining_time": "1 day, 2:07:05"}
|
| 30 |
{"current_steps": 300, "total_steps": 1931, "loss": 0.0284, "lr": 1.9820219284577052e-05, "epoch": 0.1554001554001554, "percentage": 15.54, "elapsed_time": "4:46:29", "remaining_time": "1 day, 1:57:32"}
|
| 31 |
+
{"current_steps": 310, "total_steps": 1931, "loss": 0.0277, "lr": 1.9784474052177435e-05, "epoch": 0.16058016058016059, "percentage": 16.05, "elapsed_time": "4:57:23", "remaining_time": "1 day, 1:55:01"}
|
| 32 |
+
{"current_steps": 320, "total_steps": 1931, "loss": 0.0277, "lr": 1.9745528261381156e-05, "epoch": 0.16576016576016575, "percentage": 16.57, "elapsed_time": "5:07:02", "remaining_time": "1 day, 1:45:48"}
|
| 33 |
+
{"current_steps": 330, "total_steps": 1931, "loss": 0.0272, "lr": 1.970339465158301e-05, "epoch": 0.17094017094017094, "percentage": 17.09, "elapsed_time": "5:16:19", "remaining_time": "1 day, 1:34:37"}
|
| 34 |
+
{"current_steps": 340, "total_steps": 1931, "loss": 0.0276, "lr": 1.9658087004931926e-05, "epoch": 0.1761201761201761, "percentage": 17.61, "elapsed_time": "5:25:57", "remaining_time": "1 day, 1:25:19"}
|
| 35 |
+
{"current_steps": 350, "total_steps": 1931, "loss": 0.0263, "lr": 1.960962014182276e-05, "epoch": 0.1813001813001813, "percentage": 18.13, "elapsed_time": "5:35:30", "remaining_time": "1 day, 1:15:34"}
|
| 36 |
+
{"current_steps": 360, "total_steps": 1931, "loss": 0.0267, "lr": 1.955800991604846e-05, "epoch": 0.1864801864801865, "percentage": 18.64, "elapsed_time": "5:45:08", "remaining_time": "1 day, 1:06:10"}
|
| 37 |
+
{"current_steps": 370, "total_steps": 1931, "loss": 0.0259, "lr": 1.9503273209614183e-05, "epoch": 0.19166019166019166, "percentage": 19.16, "elapsed_time": "5:54:34", "remaining_time": "1 day, 0:55:54"}
|
| 38 |
+
{"current_steps": 380, "total_steps": 1931, "loss": 0.0243, "lr": 1.9445427927215108e-05, "epoch": 0.19684019684019685, "percentage": 19.68, "elapsed_time": "6:03:57", "remaining_time": "1 day, 0:45:30"}
|
| 39 |
+
{"current_steps": 390, "total_steps": 1931, "loss": 0.0254, "lr": 1.9384492990379703e-05, "epoch": 0.20202020202020202, "percentage": 20.2, "elapsed_time": "6:13:19", "remaining_time": "1 day, 0:35:05"}
|
| 40 |
+
{"current_steps": 400, "total_steps": 1931, "loss": 0.024, "lr": 1.9320488331280372e-05, "epoch": 0.2072002072002072, "percentage": 20.71, "elapsed_time": "6:22:35", "remaining_time": "1 day, 0:24:23"}
|