Training in progress, step 49800, checkpoint
Browse files
last-checkpoint/README.md
CHANGED
|
@@ -1285,6 +1285,10 @@ You can finetune this model on your own dataset.
|
|
| 1285 |
| 0.8747 | 49500 | 0.3182 |
|
| 1286 |
| 0.8756 | 49550 | 0.3063 |
|
| 1287 |
| 0.8765 | 49600 | 0.2385 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1288 |
|
| 1289 |
|
| 1290 |
### Framework Versions
|
|
|
|
| 1285 |
| 0.8747 | 49500 | 0.3182 |
|
| 1286 |
| 0.8756 | 49550 | 0.3063 |
|
| 1287 |
| 0.8765 | 49600 | 0.2385 |
|
| 1288 |
+
| 0.8773 | 49650 | 0.3152 |
|
| 1289 |
+
| 0.8782 | 49700 | 0.267 |
|
| 1290 |
+
| 0.8791 | 49750 | 0.2599 |
|
| 1291 |
+
| 0.8800 | 49800 | 0.3226 |
|
| 1292 |
|
| 1293 |
|
| 1294 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ed2d369eb5785f37e695387aeb0f0e1b88aba7649dea47063848b806090ff91f
|
| 3 |
size 90864192
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 180609210
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7c88873a80431132be5b9a6198db1d2eb68145fe27f94342674f074b433cbd62
|
| 3 |
size 180609210
|
last-checkpoint/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 14244
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a0c031c47895ee65720a29aa486037b758096a0c008e8c7d3bf0a06b848dd598
|
| 3 |
size 14244
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:98ce6fbeef0ab2e0cecf23435bfa5221dc56a6ce59fe8d9b84d1e42bcc5d69c4
|
| 3 |
size 988
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1cd200196e0f200dd4627f60d44a82669aaadc601edaa64b9c6e1ddba3c662c9
|
| 3 |
size 1064
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -6952,6 +6952,34 @@
|
|
| 6952 |
"learning_rate": 6.8828414914295815e-06,
|
| 6953 |
"loss": 0.2385,
|
| 6954 |
"step": 49600
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6955 |
}
|
| 6956 |
],
|
| 6957 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.8799985863476525,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 49800,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 6952 |
"learning_rate": 6.8828414914295815e-06,
|
| 6953 |
"loss": 0.2385,
|
| 6954 |
"step": 49600
|
| 6955 |
+
},
|
| 6956 |
+
{
|
| 6957 |
+
"epoch": 0.8773479881960029,
|
| 6958 |
+
"grad_norm": 1.3927173614501953,
|
| 6959 |
+
"learning_rate": 6.833755473091045e-06,
|
| 6960 |
+
"loss": 0.3152,
|
| 6961 |
+
"step": 49650
|
| 6962 |
+
},
|
| 6963 |
+
{
|
| 6964 |
+
"epoch": 0.8782315209132194,
|
| 6965 |
+
"grad_norm": 1.4090054035186768,
|
| 6966 |
+
"learning_rate": 6.784669454752508e-06,
|
| 6967 |
+
"loss": 0.267,
|
| 6968 |
+
"step": 49700
|
| 6969 |
+
},
|
| 6970 |
+
{
|
| 6971 |
+
"epoch": 0.879115053630436,
|
| 6972 |
+
"grad_norm": 1.5765697956085205,
|
| 6973 |
+
"learning_rate": 6.735583436413972e-06,
|
| 6974 |
+
"loss": 0.2599,
|
| 6975 |
+
"step": 49750
|
| 6976 |
+
},
|
| 6977 |
+
{
|
| 6978 |
+
"epoch": 0.8799985863476525,
|
| 6979 |
+
"grad_norm": 1.617443323135376,
|
| 6980 |
+
"learning_rate": 6.686497418075435e-06,
|
| 6981 |
+
"loss": 0.3226,
|
| 6982 |
+
"step": 49800
|
| 6983 |
}
|
| 6984 |
],
|
| 6985 |
"logging_steps": 50,
|