Training in progress, epoch 1, checkpoint
Browse files
checkpoint-22/README.md
CHANGED
|
@@ -98,9 +98,9 @@ print(embeddings.shape)
|
|
| 98 |
# Get the similarity scores for the embeddings
|
| 99 |
similarities = model.similarity(embeddings, embeddings)
|
| 100 |
print(similarities)
|
| 101 |
-
# tensor([[1.0000, 0.
|
| 102 |
-
# [0.
|
| 103 |
-
# [0.
|
| 104 |
```
|
| 105 |
|
| 106 |
<!--
|
|
@@ -174,6 +174,7 @@ You can finetune this model on your own dataset.
|
|
| 174 |
- `per_device_eval_batch_size`: 16
|
| 175 |
- `learning_rate`: 2e-05
|
| 176 |
- `weight_decay`: 0.001
|
|
|
|
| 177 |
- `warmup_ratio`: 0.2
|
| 178 |
- `fp16`: True
|
| 179 |
- `dataloader_num_workers`: 2
|
|
@@ -204,7 +205,7 @@ You can finetune this model on your own dataset.
|
|
| 204 |
- `adam_beta2`: 0.999
|
| 205 |
- `adam_epsilon`: 1e-08
|
| 206 |
- `max_grad_norm`: 1.0
|
| 207 |
-
- `num_train_epochs`:
|
| 208 |
- `max_steps`: -1
|
| 209 |
- `lr_scheduler_type`: linear
|
| 210 |
- `lr_scheduler_kwargs`: {}
|
|
@@ -311,7 +312,7 @@ You can finetune this model on your own dataset.
|
|
| 311 |
| Epoch | Step | Training Loss |
|
| 312 |
|:------:|:----:|:-------------:|
|
| 313 |
| 0.0455 | 1 | 3.3947 |
|
| 314 |
-
| 1.0 | 22 | 2.
|
| 315 |
|
| 316 |
|
| 317 |
### Framework Versions
|
|
|
|
| 98 |
# Get the similarity scores for the embeddings
|
| 99 |
similarities = model.similarity(embeddings, embeddings)
|
| 100 |
print(similarities)
|
| 101 |
+
# tensor([[1.0000, 0.9027, 0.4485],
|
| 102 |
+
# [0.9027, 1.0000, 0.4446],
|
| 103 |
+
# [0.4485, 0.4446, 1.0000]])
|
| 104 |
```
|
| 105 |
|
| 106 |
<!--
|
|
|
|
| 174 |
- `per_device_eval_batch_size`: 16
|
| 175 |
- `learning_rate`: 2e-05
|
| 176 |
- `weight_decay`: 0.001
|
| 177 |
+
- `num_train_epochs`: 2
|
| 178 |
- `warmup_ratio`: 0.2
|
| 179 |
- `fp16`: True
|
| 180 |
- `dataloader_num_workers`: 2
|
|
|
|
| 205 |
- `adam_beta2`: 0.999
|
| 206 |
- `adam_epsilon`: 1e-08
|
| 207 |
- `max_grad_norm`: 1.0
|
| 208 |
+
- `num_train_epochs`: 2
|
| 209 |
- `max_steps`: -1
|
| 210 |
- `lr_scheduler_type`: linear
|
| 211 |
- `lr_scheduler_kwargs`: {}
|
|
|
|
| 312 |
| Epoch | Step | Training Loss |
|
| 313 |
|:------:|:----:|:-------------:|
|
| 314 |
| 0.0455 | 1 | 3.3947 |
|
| 315 |
+
| 1.0 | 22 | 2.7163 |
|
| 316 |
|
| 317 |
|
| 318 |
### Framework Versions
|
checkpoint-22/model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:44dc75dc88eaa963e3e29998f9ff2c4b342c2b9cc828ed5cc8f06f722ac95d5d
|
| 3 |
size 90864192
|
checkpoint-22/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 85254842
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e3715e5cad0bd7354d05fea88cf40f306a6bc22d5b34fd5f23d539ccc5cb287d
|
| 3 |
size 85254842
|
checkpoint-22/scheduler.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1064
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ee0889d2e1f8f81ca0859895fa3b9cec01c8ba200e1012155e6d6bf09d3f55f1
|
| 3 |
size 1064
|
checkpoint-22/trainer_state.json
CHANGED
|
@@ -18,16 +18,16 @@
|
|
| 18 |
},
|
| 19 |
{
|
| 20 |
"epoch": 1.0,
|
| 21 |
-
"grad_norm": 25.
|
| 22 |
-
"learning_rate": 1.
|
| 23 |
-
"loss": 2.
|
| 24 |
"step": 22
|
| 25 |
}
|
| 26 |
],
|
| 27 |
"logging_steps": 500,
|
| 28 |
-
"max_steps":
|
| 29 |
"num_input_tokens_seen": 0,
|
| 30 |
-
"num_train_epochs":
|
| 31 |
"save_steps": 500,
|
| 32 |
"stateful_callbacks": {
|
| 33 |
"TrainerControl": {
|
|
|
|
| 18 |
},
|
| 19 |
{
|
| 20 |
"epoch": 1.0,
|
| 21 |
+
"grad_norm": 25.27043342590332,
|
| 22 |
+
"learning_rate": 1.3142857142857145e-05,
|
| 23 |
+
"loss": 2.7163,
|
| 24 |
"step": 22
|
| 25 |
}
|
| 26 |
],
|
| 27 |
"logging_steps": 500,
|
| 28 |
+
"max_steps": 44,
|
| 29 |
"num_input_tokens_seen": 0,
|
| 30 |
+
"num_train_epochs": 2,
|
| 31 |
"save_steps": 500,
|
| 32 |
"stateful_callbacks": {
|
| 33 |
"TrainerControl": {
|
checkpoint-22/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9e91a92ff4d4228b61d5b3b1e6c465ed3cfe5a67113276860cdd9a2015549963
|
| 3 |
size 5752
|