Training in progress, step 1400, checkpoint
Browse files
- last-checkpoint/2_Dense/model.safetensors +1 -1
- last-checkpoint/3_Dense/model.safetensors +1 -1
- last-checkpoint/README.md +5 -1
- last-checkpoint/model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +30 -2
last-checkpoint/2_Dense/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 9437272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:14549a8f2b505a8545ac674725066f9c305d15592336942bb065ad4f6ddeb306
|
| 3 |
size 9437272
|
last-checkpoint/3_Dense/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 9437272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0952aa81b7cdd3daf666c37d0854e5bff5e7a14e28b4874444f7772caeb46f9d
|
| 3 |
size 9437272
|
last-checkpoint/README.md
CHANGED
|
@@ -450,7 +450,7 @@ print(query_embeddings.shape, document_embeddings.shape)
|
|
| 450 |
# Get the similarity scores for the embeddings
|
| 451 |
similarities = model.similarity(query_embeddings, document_embeddings)
|
| 452 |
print(similarities)
|
| 453 |
-
# tensor([[ 0.
|
| 454 |
```
|
| 455 |
|
| 456 |
<!--
|
|
@@ -711,6 +711,10 @@ You can finetune this model on your own dataset.
|
|
| 711 |
| 0.3640 | 1100 | 0.091 |
|
| 712 |
| 0.3805 | 1150 | 0.0802 |
|
| 713 |
| 0.3971 | 1200 | 0.0824 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 714 |
|
| 715 |
|
| 716 |
### Framework Versions
|
|
|
|
| 450 |
# Get the similarity scores for the embeddings
|
| 451 |
similarities = model.similarity(query_embeddings, document_embeddings)
|
| 452 |
print(similarities)
|
| 453 |
+
# tensor([[ 0.6231, -0.0744, 0.1279]])
|
| 454 |
```
|
| 455 |
|
| 456 |
<!--
|
|
|
|
| 711 |
| 0.3640 | 1100 | 0.091 |
|
| 712 |
| 0.3805 | 1150 | 0.0802 |
|
| 713 |
| 0.3971 | 1200 | 0.0824 |
|
| 714 |
+
| 0.4136 | 1250 | 0.0845 |
|
| 715 |
+
| 0.4302 | 1300 | 0.09 |
|
| 716 |
+
| 0.4467 | 1350 | 0.0866 |
|
| 717 |
+
| 0.4633 | 1400 | 0.0826 |
|
| 718 |
|
| 719 |
|
| 720 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1211486072
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:477457ae6906b9786bffa8dd6309187edd28e664410a059cfffacf1f2cae3bc6
|
| 3 |
size 1211486072
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2460923467
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6fcb82c0030f2e69a729cae162131808daef058010082ee7c6a1cdc5a1109b47
|
| 3 |
size 2460923467
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1383
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:3fcfe456f41c489958b10f637ef851405e803e7363ed9925c3152e6d7cebd14a
|
| 3 |
size 1383
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1465
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1807d5c010828dc5af6863500632317772ab24748d2f2f3dc9b74b307531f182
|
| 3 |
size 1465
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step": 1200,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -176,6 +176,34 @@
|
|
| 176 |
"learning_rate": 1.3409341669731519e-05,
|
| 177 |
"loss": 0.0824,
|
| 178 |
"step": 1200
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 179 |
}
|
| 180 |
],
|
| 181 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.4632693580410324,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 1400,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 176 |
"learning_rate": 1.3409341669731519e-05,
|
| 177 |
"loss": 0.0824,
|
| 178 |
"step": 1200
|
| 179 |
+
},
|
| 180 |
+
{
|
| 181 |
+
"epoch": 0.41363335539377893,
|
| 182 |
+
"grad_norm": 2.9681406021118164,
|
| 183 |
+
"learning_rate": 1.3041559396837074e-05,
|
| 184 |
+
"loss": 0.0845,
|
| 185 |
+
"step": 1250
|
| 186 |
+
},
|
| 187 |
+
{
|
| 188 |
+
"epoch": 0.4301786896095301,
|
| 189 |
+
"grad_norm": 6.426875591278076,
|
| 190 |
+
"learning_rate": 1.2673777123942627e-05,
|
| 191 |
+
"loss": 0.09,
|
| 192 |
+
"step": 1300
|
| 193 |
+
},
|
| 194 |
+
{
|
| 195 |
+
"epoch": 0.44672402382528126,
|
| 196 |
+
"grad_norm": 8.284296035766602,
|
| 197 |
+
"learning_rate": 1.2305994851048179e-05,
|
| 198 |
+
"loss": 0.0866,
|
| 199 |
+
"step": 1350
|
| 200 |
+
},
|
| 201 |
+
{
|
| 202 |
+
"epoch": 0.4632693580410324,
|
| 203 |
+
"grad_norm": 5.250367164611816,
|
| 204 |
+
"learning_rate": 1.1938212578153734e-05,
|
| 205 |
+
"loss": 0.0826,
|
| 206 |
+
"step": 1400
|
| 207 |
}
|
| 208 |
],
|
| 209 |
"logging_steps": 50,
|