Commit ·
e5e22d8
1
Parent(s): 3012035
Save best model. Best metric: val/loss:0.06462528556585312- epoch:0
Browse files
- README.md +4 -4
- config.json +1 -1
- config_sentence_transformers.json +2 -2
- model.safetensors +1 -1
README.md
CHANGED
|
@@ -82,7 +82,7 @@ The model was trained with the parameters:
|
|
| 82 |
|
| 83 |
**DataLoader**:
|
| 84 |
|
| 85 |
-
`torch.utils.data.dataloader.DataLoader` of length
|
| 86 |
```
|
| 87 |
{'batch_size': 14, 'sampler': 'torch.utils.data.sampler.RandomSampler', 'batch_sampler': 'torch.utils.data.sampler.BatchSampler'}
|
| 88 |
```
|
|
@@ -94,16 +94,16 @@ The model was trained with the parameters:
|
|
| 94 |
Parameters of the fit()-Method:
|
| 95 |
```
|
| 96 |
{
|
| 97 |
-
"epochs":
|
| 98 |
"evaluation_steps": 0,
|
| 99 |
"evaluator": "NoneType",
|
| 100 |
"max_grad_norm": 1,
|
| 101 |
"optimizer_class": "<class 'torch.optim.adamw.AdamW'>",
|
| 102 |
"optimizer_params": {
|
| 103 |
-
"lr":
|
| 104 |
},
|
| 105 |
"scheduler": "WarmupLinear",
|
| 106 |
-
"steps_per_epoch":
|
| 107 |
"warmup_steps": 5000,
|
| 108 |
"weight_decay": 0.0001
|
| 109 |
}
|
|
|
|
| 82 |
|
| 83 |
**DataLoader**:
|
| 84 |
|
| 85 |
+
`torch.utils.data.dataloader.DataLoader` of length 7843 with parameters:
|
| 86 |
```
|
| 87 |
{'batch_size': 14, 'sampler': 'torch.utils.data.sampler.RandomSampler', 'batch_sampler': 'torch.utils.data.sampler.BatchSampler'}
|
| 88 |
```
|
|
|
|
| 94 |
Parameters of the fit()-Method:
|
| 95 |
```
|
| 96 |
{
|
| 97 |
+
"epochs": 5,
|
| 98 |
"evaluation_steps": 0,
|
| 99 |
"evaluator": "NoneType",
|
| 100 |
"max_grad_norm": 1,
|
| 101 |
"optimizer_class": "<class 'torch.optim.adamw.AdamW'>",
|
| 102 |
"optimizer_params": {
|
| 103 |
+
"lr": 3e-05
|
| 104 |
},
|
| 105 |
"scheduler": "WarmupLinear",
|
| 106 |
+
"steps_per_epoch": null,
|
| 107 |
"warmup_steps": 5000,
|
| 108 |
"weight_decay": 0.0001
|
| 109 |
}
|
config.json
CHANGED
|
@@ -1,5 +1,5 @@
|
|
| 1 |
{
|
| 2 |
-
"_name_or_path": "
|
| 3 |
"architectures": [
|
| 4 |
"BertModel"
|
| 5 |
],
|
|
|
|
| 1 |
{
|
| 2 |
+
"_name_or_path": "D:\\Work\\Tasks\\mylong_ds/.cache\\quannguyenopus_tsdae-host\\",
|
| 3 |
"architectures": [
|
| 4 |
"BertModel"
|
| 5 |
],
|
config_sentence_transformers.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"__version__": {
|
| 3 |
"sentence_transformers": "2.2.2",
|
| 4 |
-
"transformers": "4.
|
| 5 |
-
"pytorch": "2.
|
| 6 |
}
|
| 7 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"__version__": {
|
| 3 |
"sentence_transformers": "2.2.2",
|
| 4 |
+
"transformers": "4.31.0",
|
| 5 |
+
"pytorch": "2.0.1+cu118"
|
| 6 |
}
|
| 7 |
}
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 90864192
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:dcccb6444c73d471ff3fc87a4c4f30481d4e9e8d143e27bb017e7ec0841d40e2
|
| 3 |
size 90864192
|