Training in progress, step 1000, checkpoint
Browse files- last-checkpoint/2_Dense/model.safetensors +1 -1
- last-checkpoint/3_Dense/model.safetensors +1 -1
- last-checkpoint/README.md +5 -1
- last-checkpoint/model.safetensors +1 -1
- last-checkpoint/optimizer.pt +1 -1
- last-checkpoint/scaler.pt +1 -1
- last-checkpoint/scheduler.pt +1 -1
- last-checkpoint/trainer_state.json +30 -2
last-checkpoint/2_Dense/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 9437272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:00693ca726c3aa172fe54b2bbf0f5a2ac7ef3e0f15e6ef10272ea4e790f1a7ea
|
| 3 |
size 9437272
|
last-checkpoint/3_Dense/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 9437272
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1ec4b258539975d8b345245718777e000a517241aa23cc10eb37dd6ffc792aab
|
| 3 |
size 9437272
|
last-checkpoint/README.md
CHANGED
|
@@ -450,7 +450,7 @@ print(query_embeddings.shape, document_embeddings.shape)
|
|
| 450 |
# Get the similarity scores for the embeddings
|
| 451 |
similarities = model.similarity(query_embeddings, document_embeddings)
|
| 452 |
print(similarities)
|
| 453 |
-
# tensor([[ 0.
|
| 454 |
```
|
| 455 |
|
| 456 |
<!--
|
|
@@ -703,6 +703,10 @@ You can finetune this model on your own dataset.
|
|
| 703 |
| 0.2316 | 700 | 0.1013 |
|
| 704 |
| 0.2482 | 750 | 0.1019 |
|
| 705 |
| 0.2647 | 800 | 0.0964 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 706 |
|
| 707 |
|
| 708 |
### Framework Versions
|
|
|
|
| 450 |
# Get the similarity scores for the embeddings
|
| 451 |
similarities = model.similarity(query_embeddings, document_embeddings)
|
| 452 |
print(similarities)
|
| 453 |
+
# tensor([[ 0.4709, -0.1225, 0.1580]])
|
| 454 |
```
|
| 455 |
|
| 456 |
<!--
|
|
|
|
| 703 |
| 0.2316 | 700 | 0.1013 |
|
| 704 |
| 0.2482 | 750 | 0.1019 |
|
| 705 |
| 0.2647 | 800 | 0.0964 |
|
| 706 |
+
| 0.2813 | 850 | 0.0961 |
|
| 707 |
+
| 0.2978 | 900 | 0.0927 |
|
| 708 |
+
| 0.3144 | 950 | 0.0946 |
|
| 709 |
+
| 0.3309 | 1000 | 0.0988 |
|
| 710 |
|
| 711 |
|
| 712 |
### Framework Versions
|
last-checkpoint/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1211486072
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:13ac8f3e49e96856b9bc03370f38b3741180dcb037151388805051f7ea3ffe8f
|
| 3 |
size 1211486072
|
last-checkpoint/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 2460923467
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:45310978fd3a8f93b72bef2a6c703555d44d1cb9ff7e494d4ad2616538a9ff9b
|
| 3 |
size 2460923467
|
last-checkpoint/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1383
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fc83c3e7cbaa37ce1778897d2e62cb7b8c41ece6f6ed0596eecff4f3f73fcd86
|
| 3 |
size 1383
|
last-checkpoint/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1465
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:220ab6d106cef455c6160d9f0f26a124a8032f6a0351c6a17f6905e5df60789d
|
| 3 |
size 1465
|
last-checkpoint/trainer_state.json
CHANGED
|
@@ -2,9 +2,9 @@
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
-
"epoch": 0.
|
| 6 |
"eval_steps": 500,
|
| 7 |
-
"global_step":
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
@@ -120,6 +120,34 @@
|
|
| 120 |
"learning_rate": 1.6351599852887092e-05,
|
| 121 |
"loss": 0.0964,
|
| 122 |
"step": 800
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 123 |
}
|
| 124 |
],
|
| 125 |
"logging_steps": 50,
|
|
|
|
| 2 |
"best_global_step": null,
|
| 3 |
"best_metric": null,
|
| 4 |
"best_model_checkpoint": null,
|
| 5 |
+
"epoch": 0.3309066843150232,
|
| 6 |
"eval_steps": 500,
|
| 7 |
+
"global_step": 1000,
|
| 8 |
"is_hyper_param_search": false,
|
| 9 |
"is_local_process_zero": true,
|
| 10 |
"is_world_process_zero": true,
|
|
|
|
| 120 |
"learning_rate": 1.6351599852887092e-05,
|
| 121 |
"loss": 0.0964,
|
| 122 |
"step": 800
|
| 123 |
+
},
|
| 124 |
+
{
|
| 125 |
+
"epoch": 0.2812706816677697,
|
| 126 |
+
"grad_norm": 6.790607929229736,
|
| 127 |
+
"learning_rate": 1.5983817579992645e-05,
|
| 128 |
+
"loss": 0.0961,
|
| 129 |
+
"step": 850
|
| 130 |
+
},
|
| 131 |
+
{
|
| 132 |
+
"epoch": 0.29781601588352086,
|
| 133 |
+
"grad_norm": 6.981550693511963,
|
| 134 |
+
"learning_rate": 1.56160353070982e-05,
|
| 135 |
+
"loss": 0.0927,
|
| 136 |
+
"step": 900
|
| 137 |
+
},
|
| 138 |
+
{
|
| 139 |
+
"epoch": 0.314361350099272,
|
| 140 |
+
"grad_norm": 4.593362808227539,
|
| 141 |
+
"learning_rate": 1.5248253034203752e-05,
|
| 142 |
+
"loss": 0.0946,
|
| 143 |
+
"step": 950
|
| 144 |
+
},
|
| 145 |
+
{
|
| 146 |
+
"epoch": 0.3309066843150232,
|
| 147 |
+
"grad_norm": 4.783601760864258,
|
| 148 |
+
"learning_rate": 1.4880470761309307e-05,
|
| 149 |
+
"loss": 0.0988,
|
| 150 |
+
"step": 1000
|
| 151 |
}
|
| 152 |
],
|
| 153 |
"logging_steps": 50,
|