radoslavralev commited on
Commit
fe00935
·
verified ·
1 Parent(s): e108771

Add new SentenceTransformer model

Browse files
Files changed (1) hide show
  1. README.md +94 -94
README.md CHANGED
@@ -67,49 +67,49 @@ model-index:
67
  type: NanoMSMARCO
68
  metrics:
69
  - type: cosine_accuracy@1
70
- value: 0.3
71
  name: Cosine Accuracy@1
72
  - type: cosine_accuracy@3
73
- value: 0.62
74
  name: Cosine Accuracy@3
75
  - type: cosine_accuracy@5
76
- value: 0.7
77
  name: Cosine Accuracy@5
78
  - type: cosine_accuracy@10
79
- value: 0.76
80
  name: Cosine Accuracy@10
81
  - type: cosine_precision@1
82
- value: 0.3
83
  name: Cosine Precision@1
84
  - type: cosine_precision@3
85
- value: 0.20666666666666664
86
  name: Cosine Precision@3
87
  - type: cosine_precision@5
88
- value: 0.14
89
  name: Cosine Precision@5
90
  - type: cosine_precision@10
91
- value: 0.07600000000000001
92
  name: Cosine Precision@10
93
  - type: cosine_recall@1
94
- value: 0.3
95
  name: Cosine Recall@1
96
  - type: cosine_recall@3
97
- value: 0.62
98
  name: Cosine Recall@3
99
  - type: cosine_recall@5
100
- value: 0.7
101
  name: Cosine Recall@5
102
  - type: cosine_recall@10
103
- value: 0.76
104
  name: Cosine Recall@10
105
  - type: cosine_ndcg@10
106
- value: 0.5415969332190478
107
  name: Cosine Ndcg@10
108
  - type: cosine_mrr@10
109
- value: 0.47016666666666657
110
  name: Cosine Mrr@10
111
  - type: cosine_map@100
112
- value: 0.4817150619220429
113
  name: Cosine Map@100
114
  - task:
115
  type: information-retrieval
@@ -119,49 +119,49 @@ model-index:
119
  type: NanoNQ
120
  metrics:
121
  - type: cosine_accuracy@1
122
- value: 0.38
123
  name: Cosine Accuracy@1
124
  - type: cosine_accuracy@3
125
- value: 0.56
126
  name: Cosine Accuracy@3
127
  - type: cosine_accuracy@5
128
- value: 0.62
129
  name: Cosine Accuracy@5
130
  - type: cosine_accuracy@10
131
- value: 0.7
132
  name: Cosine Accuracy@10
133
  - type: cosine_precision@1
134
- value: 0.38
135
  name: Cosine Precision@1
136
  - type: cosine_precision@3
137
- value: 0.19333333333333333
138
  name: Cosine Precision@3
139
  - type: cosine_precision@5
140
- value: 0.132
141
  name: Cosine Precision@5
142
  - type: cosine_precision@10
143
- value: 0.07400000000000001
144
  name: Cosine Precision@10
145
  - type: cosine_recall@1
146
- value: 0.35
147
  name: Cosine Recall@1
148
  - type: cosine_recall@3
149
- value: 0.54
150
  name: Cosine Recall@3
151
  - type: cosine_recall@5
152
- value: 0.6
153
  name: Cosine Recall@5
154
  - type: cosine_recall@10
155
- value: 0.68
156
  name: Cosine Recall@10
157
  - type: cosine_ndcg@10
158
- value: 0.5219456964879438
159
  name: Cosine Ndcg@10
160
  - type: cosine_mrr@10
161
- value: 0.4853333333333334
162
  name: Cosine Mrr@10
163
  - type: cosine_map@100
164
- value: 0.47424546661452993
165
  name: Cosine Map@100
166
  - task:
167
  type: nano-beir
@@ -171,49 +171,49 @@ model-index:
171
  type: NanoBEIR_mean
172
  metrics:
173
  - type: cosine_accuracy@1
174
- value: 0.33999999999999997
175
  name: Cosine Accuracy@1
176
  - type: cosine_accuracy@3
177
- value: 0.5900000000000001
178
  name: Cosine Accuracy@3
179
  - type: cosine_accuracy@5
180
- value: 0.6599999999999999
181
  name: Cosine Accuracy@5
182
  - type: cosine_accuracy@10
183
- value: 0.73
184
  name: Cosine Accuracy@10
185
  - type: cosine_precision@1
186
- value: 0.33999999999999997
187
  name: Cosine Precision@1
188
  - type: cosine_precision@3
189
- value: 0.19999999999999998
190
  name: Cosine Precision@3
191
  - type: cosine_precision@5
192
- value: 0.136
193
  name: Cosine Precision@5
194
  - type: cosine_precision@10
195
- value: 0.07500000000000001
196
  name: Cosine Precision@10
197
  - type: cosine_recall@1
198
- value: 0.32499999999999996
199
  name: Cosine Recall@1
200
  - type: cosine_recall@3
201
- value: 0.5800000000000001
202
  name: Cosine Recall@3
203
  - type: cosine_recall@5
204
- value: 0.6499999999999999
205
  name: Cosine Recall@5
206
  - type: cosine_recall@10
207
- value: 0.72
208
  name: Cosine Recall@10
209
  - type: cosine_ndcg@10
210
- value: 0.5317713148534957
211
  name: Cosine Ndcg@10
212
  - type: cosine_mrr@10
213
- value: 0.47775
214
  name: Cosine Mrr@10
215
  - type: cosine_map@100
216
- value: 0.47798026426828644
217
  name: Cosine Map@100
218
  ---
219
 
@@ -278,9 +278,9 @@ print(embeddings.shape)
278
  # Get the similarity scores for the embeddings
279
  similarities = model.similarity(embeddings, embeddings)
280
  print(similarities)
281
- # tensor([[1.0000, 0.7584, 0.1067],
282
- # [0.7584, 1.0000, 0.0503],
283
- # [0.1067, 0.0503, 1.0000]])
284
  ```
285
 
286
  <!--
@@ -318,21 +318,21 @@ You can finetune this model on your own dataset.
318
 
319
  | Metric | NanoMSMARCO | NanoNQ |
320
  |:--------------------|:------------|:-----------|
321
- | cosine_accuracy@1 | 0.3 | 0.38 |
322
- | cosine_accuracy@3 | 0.62 | 0.56 |
323
- | cosine_accuracy@5 | 0.7 | 0.62 |
324
- | cosine_accuracy@10 | 0.76 | 0.7 |
325
- | cosine_precision@1 | 0.3 | 0.38 |
326
- | cosine_precision@3 | 0.2067 | 0.1933 |
327
- | cosine_precision@5 | 0.14 | 0.132 |
328
- | cosine_precision@10 | 0.076 | 0.074 |
329
- | cosine_recall@1 | 0.3 | 0.35 |
330
- | cosine_recall@3 | 0.62 | 0.54 |
331
- | cosine_recall@5 | 0.7 | 0.6 |
332
- | cosine_recall@10 | 0.76 | 0.68 |
333
- | **cosine_ndcg@10** | **0.5416** | **0.5219** |
334
- | cosine_mrr@10 | 0.4702 | 0.4853 |
335
- | cosine_map@100 | 0.4817 | 0.4742 |
336
 
337
  #### Nano BEIR
338
 
@@ -350,21 +350,21 @@ You can finetune this model on your own dataset.
350
 
351
  | Metric | Value |
352
  |:--------------------|:-----------|
353
- | cosine_accuracy@1 | 0.34 |
354
- | cosine_accuracy@3 | 0.59 |
355
- | cosine_accuracy@5 | 0.66 |
356
- | cosine_accuracy@10 | 0.73 |
357
- | cosine_precision@1 | 0.34 |
358
- | cosine_precision@3 | 0.2 |
359
- | cosine_precision@5 | 0.136 |
360
- | cosine_precision@10 | 0.075 |
361
- | cosine_recall@1 | 0.325 |
362
- | cosine_recall@3 | 0.58 |
363
- | cosine_recall@5 | 0.65 |
364
- | cosine_recall@10 | 0.72 |
365
- | **cosine_ndcg@10** | **0.5318** |
366
- | cosine_mrr@10 | 0.4778 |
367
- | cosine_map@100 | 0.478 |
368
 
369
  <!--
370
  ## Bias, Risks and Limitations
@@ -438,8 +438,8 @@ You can finetune this model on your own dataset.
438
  - `eval_strategy`: steps
439
  - `per_device_train_batch_size`: 128
440
  - `per_device_eval_batch_size`: 128
441
- - `learning_rate`: 2e-05
442
- - `weight_decay`: 0.0001
443
  - `max_steps`: 3000
444
  - `warmup_ratio`: 0.1
445
  - `fp16`: True
@@ -467,8 +467,8 @@ You can finetune this model on your own dataset.
467
  - `gradient_accumulation_steps`: 1
468
  - `eval_accumulation_steps`: None
469
  - `torch_empty_cache_steps`: None
470
- - `learning_rate`: 2e-05
471
- - `weight_decay`: 0.0001
472
  - `adam_beta1`: 0.9
473
  - `adam_beta2`: 0.999
474
  - `adam_epsilon`: 1e-08
@@ -582,18 +582,18 @@ You can finetune this model on your own dataset.
582
  | Epoch | Step | Training Loss | Validation Loss | NanoMSMARCO_cosine_ndcg@10 | NanoNQ_cosine_ndcg@10 | NanoBEIR_mean_cosine_ndcg@10 |
583
  |:------:|:----:|:-------------:|:---------------:|:--------------------------:|:---------------------:|:----------------------------:|
584
  | 0 | 0 | - | 3.6614 | 0.6259 | 0.6583 | 0.6421 |
585
- | 0.3556 | 250 | 2.1172 | 0.4652 | 0.5662 | 0.5558 | 0.5610 |
586
- | 0.7112 | 500 | 0.5877 | 0.4272 | 0.5926 | 0.5289 | 0.5607 |
587
- | 1.0669 | 750 | 0.5436 | 0.4134 | 0.5476 | 0.5478 | 0.5477 |
588
- | 1.4225 | 1000 | 0.5214 | 0.4041 | 0.5461 | 0.5451 | 0.5456 |
589
- | 1.7781 | 1250 | 0.5119 | 0.3994 | 0.5316 | 0.5377 | 0.5347 |
590
- | 2.1337 | 1500 | 0.5006 | 0.3957 | 0.5357 | 0.5305 | 0.5331 |
591
- | 2.4893 | 1750 | 0.494 | 0.3934 | 0.5444 | 0.5319 | 0.5382 |
592
- | 2.8450 | 2000 | 0.4886 | 0.3906 | 0.5322 | 0.5246 | 0.5284 |
593
- | 3.2006 | 2250 | 0.4839 | 0.3889 | 0.5413 | 0.5307 | 0.5360 |
594
- | 3.5562 | 2500 | 0.4795 | 0.3881 | 0.5490 | 0.5214 | 0.5352 |
595
- | 3.9118 | 2750 | 0.479 | 0.3872 | 0.5413 | 0.5219 | 0.5316 |
596
- | 4.2674 | 3000 | 0.4765 | 0.3869 | 0.5416 | 0.5219 | 0.5318 |
597
 
598
 
599
  ### Framework Versions
 
67
  type: NanoMSMARCO
68
  metrics:
69
  - type: cosine_accuracy@1
70
+ value: 0.36
71
  name: Cosine Accuracy@1
72
  - type: cosine_accuracy@3
73
+ value: 0.6
74
  name: Cosine Accuracy@3
75
  - type: cosine_accuracy@5
76
+ value: 0.68
77
  name: Cosine Accuracy@5
78
  - type: cosine_accuracy@10
79
+ value: 0.78
80
  name: Cosine Accuracy@10
81
  - type: cosine_precision@1
82
+ value: 0.36
83
  name: Cosine Precision@1
84
  - type: cosine_precision@3
85
+ value: 0.2
86
  name: Cosine Precision@3
87
  - type: cosine_precision@5
88
+ value: 0.136
89
  name: Cosine Precision@5
90
  - type: cosine_precision@10
91
+ value: 0.07800000000000001
92
  name: Cosine Precision@10
93
  - type: cosine_recall@1
94
+ value: 0.36
95
  name: Cosine Recall@1
96
  - type: cosine_recall@3
97
+ value: 0.6
98
  name: Cosine Recall@3
99
  - type: cosine_recall@5
100
+ value: 0.68
101
  name: Cosine Recall@5
102
  - type: cosine_recall@10
103
+ value: 0.78
104
  name: Cosine Recall@10
105
  - type: cosine_ndcg@10
106
+ value: 0.5686788105462819
107
  name: Cosine Ndcg@10
108
  - type: cosine_mrr@10
109
+ value: 0.5018888888888889
110
  name: Cosine Mrr@10
111
  - type: cosine_map@100
112
+ value: 0.5110826036192063
113
  name: Cosine Map@100
114
  - task:
115
  type: information-retrieval
 
119
  type: NanoNQ
120
  metrics:
121
  - type: cosine_accuracy@1
122
+ value: 0.36
123
  name: Cosine Accuracy@1
124
  - type: cosine_accuracy@3
125
+ value: 0.66
126
  name: Cosine Accuracy@3
127
  - type: cosine_accuracy@5
128
+ value: 0.68
129
  name: Cosine Accuracy@5
130
  - type: cosine_accuracy@10
131
+ value: 0.76
132
  name: Cosine Accuracy@10
133
  - type: cosine_precision@1
134
+ value: 0.36
135
  name: Cosine Precision@1
136
  - type: cosine_precision@3
137
+ value: 0.22
138
  name: Cosine Precision@3
139
  - type: cosine_precision@5
140
+ value: 0.14
141
  name: Cosine Precision@5
142
  - type: cosine_precision@10
143
+ value: 0.08
144
  name: Cosine Precision@10
145
  - type: cosine_recall@1
146
+ value: 0.33
147
  name: Cosine Recall@1
148
  - type: cosine_recall@3
149
+ value: 0.62
150
  name: Cosine Recall@3
151
  - type: cosine_recall@5
152
+ value: 0.65
153
  name: Cosine Recall@5
154
  - type: cosine_recall@10
155
+ value: 0.72
156
  name: Cosine Recall@10
157
  - type: cosine_ndcg@10
158
+ value: 0.547217901995397
159
  name: Cosine Ndcg@10
160
  - type: cosine_mrr@10
161
+ value: 0.5098571428571428
162
  name: Cosine Mrr@10
163
  - type: cosine_map@100
164
+ value: 0.4872849044614519
165
  name: Cosine Map@100
166
  - task:
167
  type: nano-beir
 
171
  type: NanoBEIR_mean
172
  metrics:
173
  - type: cosine_accuracy@1
174
+ value: 0.36
175
  name: Cosine Accuracy@1
176
  - type: cosine_accuracy@3
177
+ value: 0.63
178
  name: Cosine Accuracy@3
179
  - type: cosine_accuracy@5
180
+ value: 0.68
181
  name: Cosine Accuracy@5
182
  - type: cosine_accuracy@10
183
+ value: 0.77
184
  name: Cosine Accuracy@10
185
  - type: cosine_precision@1
186
+ value: 0.36
187
  name: Cosine Precision@1
188
  - type: cosine_precision@3
189
+ value: 0.21000000000000002
190
  name: Cosine Precision@3
191
  - type: cosine_precision@5
192
+ value: 0.138
193
  name: Cosine Precision@5
194
  - type: cosine_precision@10
195
+ value: 0.07900000000000001
196
  name: Cosine Precision@10
197
  - type: cosine_recall@1
198
+ value: 0.345
199
  name: Cosine Recall@1
200
  - type: cosine_recall@3
201
+ value: 0.61
202
  name: Cosine Recall@3
203
  - type: cosine_recall@5
204
+ value: 0.665
205
  name: Cosine Recall@5
206
  - type: cosine_recall@10
207
+ value: 0.75
208
  name: Cosine Recall@10
209
  - type: cosine_ndcg@10
210
+ value: 0.5579483562708394
211
  name: Cosine Ndcg@10
212
  - type: cosine_mrr@10
213
+ value: 0.5058730158730158
214
  name: Cosine Mrr@10
215
  - type: cosine_map@100
216
+ value: 0.4991837540403291
217
  name: Cosine Map@100
218
  ---
219
 
 
278
  # Get the similarity scores for the embeddings
279
  similarities = model.similarity(embeddings, embeddings)
280
  print(similarities)
281
+ # tensor([[1.0000, 0.7041, 0.1992],
282
+ # [0.7041, 1.0000, 0.0598],
283
+ # [0.1992, 0.0598, 1.0000]])
284
  ```
285
 
286
  <!--
 
318
 
319
  | Metric | NanoMSMARCO | NanoNQ |
320
  |:--------------------|:------------|:-----------|
321
+ | cosine_accuracy@1 | 0.36 | 0.36 |
322
+ | cosine_accuracy@3 | 0.6 | 0.66 |
323
+ | cosine_accuracy@5 | 0.68 | 0.68 |
324
+ | cosine_accuracy@10 | 0.78 | 0.76 |
325
+ | cosine_precision@1 | 0.36 | 0.36 |
326
+ | cosine_precision@3 | 0.2 | 0.22 |
327
+ | cosine_precision@5 | 0.136 | 0.14 |
328
+ | cosine_precision@10 | 0.078 | 0.08 |
329
+ | cosine_recall@1 | 0.36 | 0.33 |
330
+ | cosine_recall@3 | 0.6 | 0.62 |
331
+ | cosine_recall@5 | 0.68 | 0.65 |
332
+ | cosine_recall@10 | 0.78 | 0.72 |
333
+ | **cosine_ndcg@10** | **0.5687** | **0.5472** |
334
+ | cosine_mrr@10 | 0.5019 | 0.5099 |
335
+ | cosine_map@100 | 0.5111 | 0.4873 |
336
 
337
  #### Nano BEIR
338
 
 
350
 
351
  | Metric | Value |
352
  |:--------------------|:-----------|
353
+ | cosine_accuracy@1 | 0.36 |
354
+ | cosine_accuracy@3 | 0.63 |
355
+ | cosine_accuracy@5 | 0.68 |
356
+ | cosine_accuracy@10 | 0.77 |
357
+ | cosine_precision@1 | 0.36 |
358
+ | cosine_precision@3 | 0.21 |
359
+ | cosine_precision@5 | 0.138 |
360
+ | cosine_precision@10 | 0.079 |
361
+ | cosine_recall@1 | 0.345 |
362
+ | cosine_recall@3 | 0.61 |
363
+ | cosine_recall@5 | 0.665 |
364
+ | cosine_recall@10 | 0.75 |
365
+ | **cosine_ndcg@10** | **0.5579** |
366
+ | cosine_mrr@10 | 0.5059 |
367
+ | cosine_map@100 | 0.4992 |
368
 
369
  <!--
370
  ## Bias, Risks and Limitations
 
438
  - `eval_strategy`: steps
439
  - `per_device_train_batch_size`: 128
440
  - `per_device_eval_batch_size`: 128
441
+ - `learning_rate`: 1e-06
442
+ - `weight_decay`: 0.001
443
  - `max_steps`: 3000
444
  - `warmup_ratio`: 0.1
445
  - `fp16`: True
 
467
  - `gradient_accumulation_steps`: 1
468
  - `eval_accumulation_steps`: None
469
  - `torch_empty_cache_steps`: None
470
+ - `learning_rate`: 1e-06
471
+ - `weight_decay`: 0.001
472
  - `adam_beta1`: 0.9
473
  - `adam_beta2`: 0.999
474
  - `adam_epsilon`: 1e-08
 
582
  | Epoch | Step | Training Loss | Validation Loss | NanoMSMARCO_cosine_ndcg@10 | NanoNQ_cosine_ndcg@10 | NanoBEIR_mean_cosine_ndcg@10 |
583
  |:------:|:----:|:-------------:|:---------------:|:--------------------------:|:---------------------:|:----------------------------:|
584
  | 0 | 0 | - | 3.6614 | 0.6259 | 0.6583 | 0.6421 |
585
+ | 0.3556 | 250 | 3.8825 | 3.4013 | 0.6200 | 0.6575 | 0.6388 |
586
+ | 0.7112 | 500 | 3.3083 | 2.1977 | 0.6287 | 0.6387 | 0.6337 |
587
+ | 1.0669 | 750 | 1.7439 | 0.6392 | 0.5543 | 0.5530 | 0.5537 |
588
+ | 1.4225 | 1000 | 0.8977 | 0.5267 | 0.5526 | 0.5274 | 0.5400 |
589
+ | 1.7781 | 1250 | 0.7869 | 0.5083 | 0.5426 | 0.5390 | 0.5408 |
590
+ | 2.1337 | 1500 | 0.7442 | 0.4991 | 0.5412 | 0.5482 | 0.5447 |
591
+ | 2.4893 | 1750 | 0.7213 | 0.4941 | 0.5553 | 0.5484 | 0.5518 |
592
+ | 2.8450 | 2000 | 0.7054 | 0.4872 | 0.5635 | 0.5506 | 0.5571 |
593
+ | 3.2006 | 2250 | 0.6943 | 0.4863 | 0.5696 | 0.5503 | 0.5599 |
594
+ | 3.5562 | 2500 | 0.6864 | 0.4839 | 0.5681 | 0.5472 | 0.5576 |
595
+ | 3.9118 | 2750 | 0.6851 | 0.4832 | 0.5687 | 0.5472 | 0.5579 |
596
+ | 4.2674 | 3000 | 0.6825 | 0.4825 | 0.5687 | 0.5472 | 0.5579 |
597
 
598
 
599
  ### Framework Versions