Training in progress, step 3000, checkpoint
Browse files
- last-checkpoint/2_Dense/model.safetensors +1 -1
- last-checkpoint/3_Dense/model.safetensors +1 -1
- last-checkpoint/README.md +5 -1
- last-checkpoint/model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +30 -2
last-checkpoint/2_Dense/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 9437272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ea38fe71b4fc93cbe68622a9309bd62ac567ce9362561aae1fb1413f1e1279c5
|
| 3 |
size 9437272
|
last-checkpoint/3_Dense/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 9437272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6578a4180e63149bd07142c934c05e790e222b4bdafe8cbfb13ec6bb7b0eb990
|
| 3 |
size 9437272
|
last-checkpoint/README.md
CHANGED
|
@@ -450,7 +450,7 @@ print(query_embeddings.shape, document_embeddings.shape)
|
|
| 450 |
# Get the similarity scores for the embeddings
|
| 451 |
similarities = model.similarity(query_embeddings, document_embeddings)
|
| 452 |
print(similarities)
|
| 453 |
-
# tensor([[ 0.
|
| 454 |
```
|
| 455 |
|
| 456 |
<!--
|
|
@@ -743,6 +743,10 @@ You can finetune this model on your own dataset.
|
|
| 743 |
| 0.8934 | 2700 | 0.0619 |
|
| 744 |
| 0.9100 | 2750 | 0.0501 |
|
| 745 |
| 0.9265 | 2800 | 0.0488 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 746 |
|
| 747 |
|
| 748 |
### Framework Versions
|
|
|
|
| 450 |
# Get the similarity scores for the embeddings
|
| 451 |
similarities = model.similarity(query_embeddings, document_embeddings)
|
| 452 |
print(similarities)
|
| 453 |
+
# tensor([[ 0.5897, -0.1380, 0.2647]])
|
| 454 |
```
|
| 455 |
|
| 456 |
<!--
|
|
|
|
| 743 |
| 0.8934 | 2700 | 0.0619 |
|
| 744 |
| 0.9100 | 2750 | 0.0501 |
|
| 745 |
| 0.9265 | 2800 | 0.0488 |
|
| 746 |
+
| 0.9431 | 2850 | 0.0596 |
|
| 747 |
+
| 0.9596 | 2900 | 0.0514 |
|
| 748 |
+
| 0.9762 | 2950 | 0.0556 |
|
| 749 |
+
| 0.9927 | 3000 | 0.0395 |
|
| 750 |
|
| 751 |
|
| 752 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1211486072
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ef383b42a96cf989b5ea5f2f57691ed7f173177e227d8af401b1ce939eeeef0e
|
| 3 |
size 1211486072
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2460923467
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f8682dc9728a848b2d7b2200731d8a05575a66f7e9e9ba3f88c6ec383f5127ac
|
| 3 |
size 2460923467
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1383
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fb197e441ecbf3d517ec5cc71281886cf0daa798b522fd64348360f6a6763284
|
| 3 |
size 1383
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1465
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:879e85e1c6ae493744a544924cd5f86076951c82592e69abf0d8b51b66bc5e1a
|
| 3 |
size 1465
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -400,6 +400,34 @@
|
|
| 400 |
"learning_rate": 1.6403089371092316e-06,
|
| 401 |
"loss": 0.0488,
|
| 402 |
"step": 2800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 403 |
}
|
| 404 |
],
|
| 405 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.9927200529450695,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 3000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 400 |
"learning_rate": 1.6403089371092316e-06,
|
| 401 |
"loss": 0.0488,
|
| 402 |
"step": 2800
|
| 403 |
+
},
|
| 404 |
+
{
|
| 405 |
+
"epoch": 0.9430840502978161,
|
| 406 |
+
"grad_norm": 8.403130531311035,
|
| 407 |
+
"learning_rate": 1.272526664214785e-06,
|
| 408 |
+
"loss": 0.0596,
|
| 409 |
+
"step": 2850
|
| 410 |
+
},
|
| 411 |
+
{
|
| 412 |
+
"epoch": 0.9596293845135672,
|
| 413 |
+
"grad_norm": 2.115785837173462,
|
| 414 |
+
"learning_rate": 9.047443913203384e-07,
|
| 415 |
+
"loss": 0.0514,
|
| 416 |
+
"step": 2900
|
| 417 |
+
},
|
| 418 |
+
{
|
| 419 |
+
"epoch": 0.9761747187293184,
|
| 420 |
+
"grad_norm": 4.952437400817871,
|
| 421 |
+
"learning_rate": 5.369621184258919e-07,
|
| 422 |
+
"loss": 0.0556,
|
| 423 |
+
"step": 2950
|
| 424 |
+
},
|
| 425 |
+
{
|
| 426 |
+
"epoch": 0.9927200529450695,
|
| 427 |
+
"grad_norm": 3.030841588973999,
|
| 428 |
+
"learning_rate": 1.691798455314454e-07,
|
| 429 |
+
"loss": 0.0395,
|
| 430 |
+
"step": 3000
|
| 431 |
}
|
| 432 |
],
|
| 433 |
"logging_steps": 50,
|