Training in progress, epoch 1, checkpoint
Browse files- checkpoint-43/README.md +4 -4
- checkpoint-43/model.safetensors +1 -1
- checkpoint-43/optimizer.pt +2 -2
- checkpoint-43/scaler.pt +1 -1
- checkpoint-43/scheduler.pt +1 -1
- checkpoint-43/trainer_state.json +4 -4
- checkpoint-43/training_args.bin +1 -1
checkpoint-43/README.md
CHANGED
|
@@ -98,9 +98,9 @@ print(embeddings.shape)
|
|
| 98 |
# Get the similarity scores for the embeddings
|
| 99 |
similarities = model.similarity(embeddings, embeddings)
|
| 100 |
print(similarities)
|
| 101 |
-
# tensor([[1.0000, 0.
|
| 102 |
-
# [0.
|
| 103 |
-
# [0.
|
| 104 |
```
|
| 105 |
|
| 106 |
<!--
|
|
@@ -312,7 +312,7 @@ You can finetune this model on your own dataset.
|
|
| 312 |
| Epoch | Step | Training Loss |
|
| 313 |
|:------:|:----:|:-------------:|
|
| 314 |
| 0.0233 | 1 | 2.5914 |
|
| 315 |
-
| 1.0 | 43 | 2.
|
| 316 |
|
| 317 |
|
| 318 |
### Framework Versions
|
|
|
|
| 98 |
# Get the similarity scores for the embeddings
|
| 99 |
similarities = model.similarity(embeddings, embeddings)
|
| 100 |
print(similarities)
|
| 101 |
+
# tensor([[1.0000, 0.9007, 0.4676],
|
| 102 |
+
# [0.9007, 1.0000, 0.4624],
|
| 103 |
+
# [0.4676, 0.4624, 1.0000]])
|
| 104 |
```
|
| 105 |
|
| 106 |
<!--
|
|
|
|
| 312 |
| Epoch | Step | Training Loss |
|
| 313 |
|:------:|:----:|:-------------:|
|
| 314 |
| 0.0233 | 1 | 2.5914 |
|
| 315 |
+
| 1.0 | 43 | 2.1891 |
|
| 316 |
|
| 317 |
|
| 318 |
### Framework Versions
|
checkpoint-43/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f50a0cca591d7a769c2fe6e6b0856e64ef71e4ab0334e45baca8851a6ae41293
|
| 3 |
size 90864192
|
checkpoint-43/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:96d3d58ba60b0b7452ffde48c753a7977aed1b87a67c8734cb934e7f8cdfbdc6
|
| 3 |
+
size 71045818
|
checkpoint-43/scaler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 988
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1bfb34fc594a255d8d9883559f9c507f4ab597426c0530a298f905d8357fa14
|
| 3 |
size 988
|
checkpoint-43/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:192eb4a369a802fe9cbb56bc0941e56d3a280b6a6d0c5fc0f648043259afaba6
|
| 3 |
size 1064
|
checkpoint-43/trainer_state.json
CHANGED
|
@@ -11,16 +11,16 @@
|
|
| 11 |
"log_history": [
|
| 12 |
{
|
| 13 |
"epoch": 0.023255813953488372,
|
| 14 |
-
"grad_norm":
|
| 15 |
"learning_rate": 0.0,
|
| 16 |
"loss": 2.5914,
|
| 17 |
"step": 1
|
| 18 |
},
|
| 19 |
{
|
| 20 |
"epoch": 1.0,
|
| 21 |
-
"grad_norm":
|
| 22 |
-
"learning_rate": 1.
|
| 23 |
-
"loss": 2.
|
| 24 |
"step": 43
|
| 25 |
}
|
| 26 |
],
|
|
|
|
| 11 |
"log_history": [
|
| 12 |
{
|
| 13 |
"epoch": 0.023255813953488372,
|
| 14 |
+
"grad_norm": 22.848411560058594,
|
| 15 |
"learning_rate": 0.0,
|
| 16 |
"loss": 2.5914,
|
| 17 |
"step": 1
|
| 18 |
},
|
| 19 |
{
|
| 20 |
"epoch": 1.0,
|
| 21 |
+
"grad_norm": 20.43097496032715,
|
| 22 |
+
"learning_rate": 1.323529411764706e-05,
|
| 23 |
+
"loss": 2.1891,
|
| 24 |
"step": 43
|
| 25 |
}
|
| 26 |
],
|
checkpoint-43/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:38d573d7ed89a9c75acf2340821fe907e16db1f608f1624a2970d502b84c6505
|
| 3 |
size 5752
|