Training in progress, step 1500
Browse files- model.safetensors +1 -1
- trainer_log.jsonl +10 -0
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3554214752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3ea753ab5b73dd533567770c7ac365fd3e2cb71665b6a7b1f53aec52e55b2f11
|
| 3 |
size 3554214752
|
trainer_log.jsonl
CHANGED
|
@@ -138,3 +138,13 @@
|
|
| 138 |
{"current_steps": 1380, "total_steps": 1931, "loss": 0.0153, "lr": 4.5832219557385896e-06, "epoch": 0.7148407148407149, "percentage": 71.47, "elapsed_time": "22:00:21", "remaining_time": "8:47:11"}
|
| 139 |
{"current_steps": 1390, "total_steps": 1931, "loss": 0.0153, "lr": 4.432085119077536e-06, "epoch": 0.72002072002072, "percentage": 71.98, "elapsed_time": "22:09:48", "remaining_time": "8:37:34"}
|
| 140 |
{"current_steps": 1400, "total_steps": 1931, "loss": 0.0153, "lr": 4.2827695797727835e-06, "epoch": 0.7252007252007252, "percentage": 72.5, "elapsed_time": "22:19:12", "remaining_time": "8:27:56"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 138 |
{"current_steps": 1380, "total_steps": 1931, "loss": 0.0153, "lr": 4.5832219557385896e-06, "epoch": 0.7148407148407149, "percentage": 71.47, "elapsed_time": "22:00:21", "remaining_time": "8:47:11"}
|
| 139 |
{"current_steps": 1390, "total_steps": 1931, "loss": 0.0153, "lr": 4.432085119077536e-06, "epoch": 0.72002072002072, "percentage": 71.98, "elapsed_time": "22:09:48", "remaining_time": "8:37:34"}
|
| 140 |
{"current_steps": 1400, "total_steps": 1931, "loss": 0.0153, "lr": 4.2827695797727835e-06, "epoch": 0.7252007252007252, "percentage": 72.5, "elapsed_time": "22:19:12", "remaining_time": "8:27:56"}
|
| 141 |
+
{"current_steps": 1410, "total_steps": 1931, "loss": 0.0158, "lr": 4.135324179806079e-06, "epoch": 0.7303807303807304, "percentage": 73.02, "elapsed_time": "22:30:16", "remaining_time": "8:18:56"}
|
| 142 |
+
{"current_steps": 1420, "total_steps": 1931, "loss": 0.0153, "lr": 3.989797149425714e-06, "epoch": 0.7355607355607355, "percentage": 73.54, "elapsed_time": "22:39:34", "remaining_time": "8:09:15"}
|
| 143 |
+
{"current_steps": 1430, "total_steps": 1931, "loss": 0.0154, "lr": 3.846236091370119e-06, "epoch": 0.7407407407407407, "percentage": 74.05, "elapsed_time": "22:48:58", "remaining_time": "7:59:37"}
|
| 144 |
+
{"current_steps": 1440, "total_steps": 1931, "loss": 0.0162, "lr": 3.704687965296746e-06, "epoch": 0.745920745920746, "percentage": 74.57, "elapsed_time": "22:58:33", "remaining_time": "7:50:02"}
|
| 145 |
+
{"current_steps": 1450, "total_steps": 1931, "loss": 0.0153, "lr": 3.5651990724212716e-06, "epoch": 0.7511007511007511, "percentage": 75.09, "elapsed_time": "23:07:56", "remaining_time": "7:40:24"}
|
| 146 |
+
{"current_steps": 1460, "total_steps": 1931, "loss": 0.0155, "lr": 3.4278150403722222e-06, "epoch": 0.7562807562807563, "percentage": 75.61, "elapsed_time": "23:17:21", "remaining_time": "7:30:47"}
|
| 147 |
+
{"current_steps": 1470, "total_steps": 1931, "loss": 0.0154, "lr": 3.292580808265897e-06, "epoch": 0.7614607614607615, "percentage": 76.13, "elapsed_time": "23:26:45", "remaining_time": "7:21:10"}
|
| 148 |
+
{"current_steps": 1480, "total_steps": 1931, "loss": 0.0152, "lr": 3.1595406120065174e-06, "epoch": 0.7666407666407666, "percentage": 76.64, "elapsed_time": "23:36:14", "remaining_time": "7:11:34"}
|
| 149 |
+
{"current_steps": 1490, "total_steps": 1931, "loss": 0.0148, "lr": 3.0287379698164245e-06, "epoch": 0.7718207718207718, "percentage": 77.16, "elapsed_time": "23:45:36", "remaining_time": "7:01:56"}
|
| 150 |
+
{"current_steps": 1500, "total_steps": 1931, "loss": 0.0161, "lr": 2.900215668000991e-06, "epoch": 0.777000777000777, "percentage": 77.68, "elapsed_time": "23:55:19", "remaining_time": "6:52:24"}
|