Training in progress, step 1800
Browse files- model.safetensors +1 -1
- trainer_log.jsonl +10 -0
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3554214752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3e9d264cd490b3b6424523c411878343957fda68cf5d8066f3ed7a6439a489a2
|
| 3 |
size 3554214752
|
trainer_log.jsonl
CHANGED
|
@@ -168,3 +168,13 @@
|
|
| 168 |
{"current_steps": 1680, "total_steps": 1931, "loss": 0.0151, "lr": 1.0207986885655664e-06, "epoch": 0.8702408702408703, "percentage": 87.0, "elapsed_time": "1 day, 2:48:18", "remaining_time": "4:00:17"}
|
| 169 |
{"current_steps": 1690, "total_steps": 1931, "loss": 0.015, "lr": 9.426631707752243e-07, "epoch": 0.8754208754208754, "percentage": 87.52, "elapsed_time": "1 day, 2:57:47", "remaining_time": "3:50:42"}
|
| 170 |
{"current_steps": 1700, "total_steps": 1931, "loss": 0.0155, "lr": 8.674903605648221e-07, "epoch": 0.8806008806008806, "percentage": 88.04, "elapsed_time": "1 day, 3:07:14", "remaining_time": "3:41:06"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 168 |
{"current_steps": 1680, "total_steps": 1931, "loss": 0.0151, "lr": 1.0207986885655664e-06, "epoch": 0.8702408702408703, "percentage": 87.0, "elapsed_time": "1 day, 2:48:18", "remaining_time": "4:00:17"}
|
| 169 |
{"current_steps": 1690, "total_steps": 1931, "loss": 0.015, "lr": 9.426631707752243e-07, "epoch": 0.8754208754208754, "percentage": 87.52, "elapsed_time": "1 day, 2:57:47", "remaining_time": "3:50:42"}
|
| 170 |
{"current_steps": 1700, "total_steps": 1931, "loss": 0.0155, "lr": 8.674903605648221e-07, "epoch": 0.8806008806008806, "percentage": 88.04, "elapsed_time": "1 day, 3:07:14", "remaining_time": "3:41:06"}
|
| 171 |
+
{"current_steps": 1710, "total_steps": 1931, "loss": 0.0149, "lr": 7.953048473980041e-07, "epoch": 0.8857808857808858, "percentage": 88.56, "elapsed_time": "1 day, 3:18:23", "remaining_time": "3:31:44"}
|
| 172 |
+
{"current_steps": 1720, "total_steps": 1931, "loss": 0.0155, "lr": 7.261302435761564e-07, "epoch": 0.8909608909608909, "percentage": 89.07, "elapsed_time": "1 day, 3:27:50", "remaining_time": "3:22:08"}
|
| 173 |
+
{"current_steps": 1730, "total_steps": 1931, "loss": 0.0148, "lr": 6.59989176514707e-07, "epoch": 0.8961408961408961, "percentage": 89.59, "elapsed_time": "1 day, 3:37:28", "remaining_time": "3:12:34"}
|
| 174 |
+
{"current_steps": 1740, "total_steps": 1931, "loss": 0.0145, "lr": 5.969032813415577e-07, "epoch": 0.9013209013209014, "percentage": 90.11, "elapsed_time": "1 day, 3:46:52", "remaining_time": "3:02:58"}
|
| 175 |
+
{"current_steps": 1750, "total_steps": 1931, "loss": 0.015, "lr": 5.368931938201006e-07, "epoch": 0.9065009065009065, "percentage": 90.63, "elapsed_time": "1 day, 3:56:16", "remaining_time": "2:53:22"}
|
| 176 |
+
{"current_steps": 1760, "total_steps": 1931, "loss": 0.0148, "lr": 4.799785435991577e-07, "epoch": 0.9116809116809117, "percentage": 91.14, "elapsed_time": "1 day, 4:05:36", "remaining_time": "2:43:46"}
|
| 177 |
+
{"current_steps": 1770, "total_steps": 1931, "loss": 0.0151, "lr": 4.261779477919892e-07, "epoch": 0.9168609168609169, "percentage": 91.66, "elapsed_time": "1 day, 4:14:44", "remaining_time": "2:34:09"}
|
| 178 |
+
{"current_steps": 1780, "total_steps": 1931, "loss": 0.0156, "lr": 3.755090048865406e-07, "epoch": 0.922040922040922, "percentage": 92.18, "elapsed_time": "1 day, 4:24:19", "remaining_time": "2:24:34"}
|
| 179 |
+
{"current_steps": 1790, "total_steps": 1931, "loss": 0.0147, "lr": 3.27988288988873e-07, "epoch": 0.9272209272209272, "percentage": 92.7, "elapsed_time": "1 day, 4:33:42", "remaining_time": "2:14:59"}
|
| 180 |
+
{"current_steps": 1800, "total_steps": 1931, "loss": 0.0151, "lr": 2.8363134440166806e-07, "epoch": 0.9324009324009324, "percentage": 93.22, "elapsed_time": "1 day, 4:43:03", "remaining_time": "2:05:24"}
|