Training in progress, step 2200, checkpoint
Browse files- last-checkpoint/2_Dense/model.safetensors +1 -1
- last-checkpoint/3_Dense/model.safetensors +1 -1
- last-checkpoint/README.md +5 -1
- last-checkpoint/model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +30 -2
last-checkpoint/2_Dense/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 9437272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:bc70cd979bc0f8d6854ac24389fb9983bd7c1348da5adf8b9ce14ea9c13e1437
|
| 3 |
size 9437272
|
last-checkpoint/3_Dense/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 9437272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:da87d038bf430393d72e8162a91cdaf090b88f744ba76c25999544816381f7ca
|
| 3 |
size 9437272
|
last-checkpoint/README.md
CHANGED
|
@@ -450,7 +450,7 @@ print(query_embeddings.shape, document_embeddings.shape)
|
|
| 450 |
# Get the similarity scores for the embeddings
|
| 451 |
similarities = model.similarity(query_embeddings, document_embeddings)
|
| 452 |
print(similarities)
|
| 453 |
-
# tensor([[ 0.
|
| 454 |
```
|
| 455 |
|
| 456 |
<!--
|
|
@@ -727,6 +727,10 @@ You can finetune this model on your own dataset.
|
|
| 727 |
| 0.6287 | 1900 | 0.085 |
|
| 728 |
| 0.6453 | 1950 | 0.0661 |
|
| 729 |
| 0.6618 | 2000 | 0.0676 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 730 |
|
| 731 |
|
| 732 |
### Framework Versions
|
|
|
|
| 450 |
# Get the similarity scores for the embeddings
|
| 451 |
similarities = model.similarity(query_embeddings, document_embeddings)
|
| 452 |
print(similarities)
|
| 453 |
+
# tensor([[ 0.5013, -0.1183, 0.2914]])
|
| 454 |
```
|
| 455 |
|
| 456 |
<!--
|
|
|
|
| 727 |
| 0.6287 | 1900 | 0.085 |
|
| 728 |
| 0.6453 | 1950 | 0.0661 |
|
| 729 |
| 0.6618 | 2000 | 0.0676 |
|
| 730 |
+
| 0.6784 | 2050 | 0.0598 |
|
| 731 |
+
| 0.6949 | 2100 | 0.0734 |
|
| 732 |
+
| 0.7114 | 2150 | 0.0653 |
|
| 733 |
+
| 0.7280 | 2200 | 0.0751 |
|
| 734 |
|
| 735 |
|
| 736 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1211486072
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0473cfcb7e3c364fd02654b46c9d660aaf46bf1670ce0cb4ce0ebb6d79517a7f
|
| 3 |
size 1211486072
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2460923467
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:46eae69537d2228e82f1efd9242173793094fb832fc89a291b843d223ca72e45
|
| 3 |
size 2460923467
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1383
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:514519403b4ca514f8ce9852255fb8898d761d1af37eddca5abb7c9fcbc625f2
|
| 3 |
size 1383
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1465
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2a5514a935e35b6a4a520541aa5fd6620a939141d2380504a718d93807ed07a4
|
| 3 |
size 1465
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -288,6 +288,34 @@
|
|
| 288 |
"learning_rate": 7.524825303420375e-06,
|
| 289 |
"loss": 0.0676,
|
| 290 |
"step": 2000
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 291 |
}
|
| 292 |
],
|
| 293 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.727994705493051,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 2200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 288 |
"learning_rate": 7.524825303420375e-06,
|
| 289 |
"loss": 0.0676,
|
| 290 |
"step": 2000
|
| 291 |
+
},
|
| 292 |
+
{
|
| 293 |
+
"epoch": 0.6783587028457975,
|
| 294 |
+
"grad_norm": 4.1648077964782715,
|
| 295 |
+
"learning_rate": 7.157043030525929e-06,
|
| 296 |
+
"loss": 0.0598,
|
| 297 |
+
"step": 2050
|
| 298 |
+
},
|
| 299 |
+
{
|
| 300 |
+
"epoch": 0.6949040370615487,
|
| 301 |
+
"grad_norm": 7.234411716461182,
|
| 302 |
+
"learning_rate": 6.789260757631483e-06,
|
| 303 |
+
"loss": 0.0734,
|
| 304 |
+
"step": 2100
|
| 305 |
+
},
|
| 306 |
+
{
|
| 307 |
+
"epoch": 0.7114493712772998,
|
| 308 |
+
"grad_norm": 6.458765029907227,
|
| 309 |
+
"learning_rate": 6.421478484737036e-06,
|
| 310 |
+
"loss": 0.0653,
|
| 311 |
+
"step": 2150
|
| 312 |
+
},
|
| 313 |
+
{
|
| 314 |
+
"epoch": 0.727994705493051,
|
| 315 |
+
"grad_norm": 4.6173930168151855,
|
| 316 |
+
"learning_rate": 6.05369621184259e-06,
|
| 317 |
+
"loss": 0.0751,
|
| 318 |
+
"step": 2200
|
| 319 |
}
|
| 320 |
],
|
| 321 |
"logging_steps": 50,
|