radoslavralev commited on
Commit
df8cabd
·
verified ·
1 Parent(s): 477c33b

Add new SentenceTransformer model

Browse files
Files changed (2) hide show
  1. README.md +112 -99
  2. config_sentence_transformers.json +1 -1
README.md CHANGED
@@ -7,7 +7,7 @@ tags:
7
  - generated_from_trainer
8
  - dataset_size:111470
9
  - loss:MultipleNegativesRankingLoss
10
- base_model: thenlper/gte-small
11
  widget:
12
  - source_sentence: why are some rocks radioactive
13
  sentences:
@@ -106,7 +106,7 @@ metrics:
106
  - cosine_mrr@10
107
  - cosine_map@100
108
  model-index:
109
- - name: SentenceTransformer based on thenlper/gte-small
110
  results:
111
  - task:
112
  type: information-retrieval
@@ -116,49 +116,49 @@ model-index:
116
  type: NanoMSMARCO
117
  metrics:
118
  - type: cosine_accuracy@1
119
- value: 0.38
120
  name: Cosine Accuracy@1
121
  - type: cosine_accuracy@3
122
- value: 0.6
123
  name: Cosine Accuracy@3
124
  - type: cosine_accuracy@5
125
- value: 0.66
126
  name: Cosine Accuracy@5
127
  - type: cosine_accuracy@10
128
  value: 0.68
129
  name: Cosine Accuracy@10
130
  - type: cosine_precision@1
131
- value: 0.38
132
  name: Cosine Precision@1
133
  - type: cosine_precision@3
134
- value: 0.2
135
  name: Cosine Precision@3
136
  - type: cosine_precision@5
137
- value: 0.132
138
  name: Cosine Precision@5
139
  - type: cosine_precision@10
140
  value: 0.068
141
  name: Cosine Precision@10
142
  - type: cosine_recall@1
143
- value: 0.38
144
  name: Cosine Recall@1
145
  - type: cosine_recall@3
146
- value: 0.6
147
  name: Cosine Recall@3
148
  - type: cosine_recall@5
149
- value: 0.66
150
  name: Cosine Recall@5
151
  - type: cosine_recall@10
152
  value: 0.68
153
  name: Cosine Recall@10
154
  - type: cosine_ndcg@10
155
- value: 0.5369233576215849
156
  name: Cosine Ndcg@10
157
  - type: cosine_mrr@10
158
- value: 0.48966666666666664
159
  name: Cosine Mrr@10
160
  - type: cosine_map@100
161
- value: 0.5049307222721455
162
  name: Cosine Map@100
163
  - task:
164
  type: information-retrieval
@@ -168,49 +168,49 @@ model-index:
168
  type: NanoNQ
169
  metrics:
170
  - type: cosine_accuracy@1
171
- value: 0.42
172
  name: Cosine Accuracy@1
173
  - type: cosine_accuracy@3
174
- value: 0.56
175
  name: Cosine Accuracy@3
176
  - type: cosine_accuracy@5
177
- value: 0.62
178
  name: Cosine Accuracy@5
179
  - type: cosine_accuracy@10
180
- value: 0.74
181
  name: Cosine Accuracy@10
182
  - type: cosine_precision@1
183
- value: 0.42
184
  name: Cosine Precision@1
185
  - type: cosine_precision@3
186
- value: 0.19333333333333333
187
  name: Cosine Precision@3
188
  - type: cosine_precision@5
189
- value: 0.128
190
  name: Cosine Precision@5
191
  - type: cosine_precision@10
192
- value: 0.07600000000000001
193
  name: Cosine Precision@10
194
  - type: cosine_recall@1
195
- value: 0.39
196
  name: Cosine Recall@1
197
  - type: cosine_recall@3
198
- value: 0.53
199
  name: Cosine Recall@3
200
  - type: cosine_recall@5
201
- value: 0.59
202
  name: Cosine Recall@5
203
  - type: cosine_recall@10
204
- value: 0.69
205
  name: Cosine Recall@10
206
  - type: cosine_ndcg@10
207
- value: 0.5406765177061442
208
  name: Cosine Ndcg@10
209
  - type: cosine_mrr@10
210
- value: 0.5126031746031746
211
  name: Cosine Mrr@10
212
  - type: cosine_map@100
213
- value: 0.49920094784101693
214
  name: Cosine Map@100
215
  - task:
216
  type: nano-beir
@@ -220,61 +220,61 @@ model-index:
220
  type: NanoBEIR_mean
221
  metrics:
222
  - type: cosine_accuracy@1
223
- value: 0.4
224
  name: Cosine Accuracy@1
225
  - type: cosine_accuracy@3
226
- value: 0.5800000000000001
227
  name: Cosine Accuracy@3
228
  - type: cosine_accuracy@5
229
- value: 0.64
230
  name: Cosine Accuracy@5
231
  - type: cosine_accuracy@10
232
- value: 0.71
233
  name: Cosine Accuracy@10
234
  - type: cosine_precision@1
235
- value: 0.4
236
  name: Cosine Precision@1
237
  - type: cosine_precision@3
238
- value: 0.19666666666666666
239
  name: Cosine Precision@3
240
  - type: cosine_precision@5
241
- value: 0.13
242
  name: Cosine Precision@5
243
  - type: cosine_precision@10
244
- value: 0.07200000000000001
245
  name: Cosine Precision@10
246
  - type: cosine_recall@1
247
- value: 0.385
248
  name: Cosine Recall@1
249
  - type: cosine_recall@3
250
- value: 0.565
251
  name: Cosine Recall@3
252
  - type: cosine_recall@5
253
- value: 0.625
254
  name: Cosine Recall@5
255
  - type: cosine_recall@10
256
- value: 0.685
257
  name: Cosine Recall@10
258
  - type: cosine_ndcg@10
259
- value: 0.5387999376638646
260
  name: Cosine Ndcg@10
261
  - type: cosine_mrr@10
262
- value: 0.5011349206349206
263
  name: Cosine Mrr@10
264
  - type: cosine_map@100
265
- value: 0.5020658350565812
266
  name: Cosine Map@100
267
  ---
268
 
269
- # SentenceTransformer based on thenlper/gte-small
270
 
271
- This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [thenlper/gte-small](https://huggingface.co/thenlper/gte-small). It maps sentences & paragraphs to a 384-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
272
 
273
  ## Model Details
274
 
275
  ### Model Description
276
  - **Model Type:** Sentence Transformer
277
- - **Base model:** [thenlper/gte-small](https://huggingface.co/thenlper/gte-small) <!-- at revision 17e1f347d17fe144873b1201da91788898c639cd -->
278
  - **Maximum Sequence Length:** 128 tokens
279
  - **Output Dimensionality:** 384 dimensions
280
  - **Similarity Function:** Cosine Similarity
@@ -327,9 +327,9 @@ print(embeddings.shape)
327
  # Get the similarity scores for the embeddings
328
  similarities = model.similarity(embeddings, embeddings)
329
  print(similarities)
330
- # tensor([[1.0001, 1.0001, 0.9814],
331
- # [1.0001, 1.0001, 0.9814],
332
- # [0.9814, 0.9814, 1.0000]])
333
  ```
334
 
335
  <!--
@@ -367,21 +367,21 @@ You can finetune this model on your own dataset.
367
 
368
  | Metric | NanoMSMARCO | NanoNQ |
369
  |:--------------------|:------------|:-----------|
370
- | cosine_accuracy@1 | 0.38 | 0.42 |
371
- | cosine_accuracy@3 | 0.6 | 0.56 |
372
- | cosine_accuracy@5 | 0.66 | 0.62 |
373
- | cosine_accuracy@10 | 0.68 | 0.74 |
374
- | cosine_precision@1 | 0.38 | 0.42 |
375
- | cosine_precision@3 | 0.2 | 0.1933 |
376
- | cosine_precision@5 | 0.132 | 0.128 |
377
- | cosine_precision@10 | 0.068 | 0.076 |
378
- | cosine_recall@1 | 0.38 | 0.39 |
379
- | cosine_recall@3 | 0.6 | 0.53 |
380
- | cosine_recall@5 | 0.66 | 0.59 |
381
- | cosine_recall@10 | 0.68 | 0.69 |
382
- | **cosine_ndcg@10** | **0.5369** | **0.5407** |
383
- | cosine_mrr@10 | 0.4897 | 0.5126 |
384
- | cosine_map@100 | 0.5049 | 0.4992 |
385
 
386
  #### Nano BEIR
387
 
@@ -397,23 +397,23 @@ You can finetune this model on your own dataset.
397
  }
398
  ```
399
 
400
- | Metric | Value |
401
- |:--------------------|:-----------|
402
- | cosine_accuracy@1 | 0.4 |
403
- | cosine_accuracy@3 | 0.58 |
404
- | cosine_accuracy@5 | 0.64 |
405
- | cosine_accuracy@10 | 0.71 |
406
- | cosine_precision@1 | 0.4 |
407
- | cosine_precision@3 | 0.1967 |
408
- | cosine_precision@5 | 0.13 |
409
- | cosine_precision@10 | 0.072 |
410
- | cosine_recall@1 | 0.385 |
411
- | cosine_recall@3 | 0.565 |
412
- | cosine_recall@5 | 0.625 |
413
- | cosine_recall@10 | 0.685 |
414
- | **cosine_ndcg@10** | **0.5388** |
415
- | cosine_mrr@10 | 0.5011 |
416
- | cosine_map@100 | 0.5021 |
417
 
418
  <!--
419
  ## Bias, Risks and Limitations
@@ -487,9 +487,9 @@ You can finetune this model on your own dataset.
487
  - `eval_strategy`: steps
488
  - `per_device_train_batch_size`: 128
489
  - `per_device_eval_batch_size`: 128
490
- - `learning_rate`: 8e-05
491
- - `weight_decay`: 0.005
492
- - `max_steps`: 1687
493
  - `warmup_ratio`: 0.1
494
  - `fp16`: True
495
  - `dataloader_drop_last`: True
@@ -516,14 +516,14 @@ You can finetune this model on your own dataset.
516
  - `gradient_accumulation_steps`: 1
517
  - `eval_accumulation_steps`: None
518
  - `torch_empty_cache_steps`: None
519
- - `learning_rate`: 8e-05
520
- - `weight_decay`: 0.005
521
  - `adam_beta1`: 0.9
522
  - `adam_beta2`: 0.999
523
  - `adam_epsilon`: 1e-08
524
  - `max_grad_norm`: 1.0
525
  - `num_train_epochs`: 3.0
526
- - `max_steps`: 1687
527
  - `lr_scheduler_type`: linear
528
  - `lr_scheduler_kwargs`: {}
529
  - `warmup_ratio`: 0.1
@@ -628,17 +628,30 @@ You can finetune this model on your own dataset.
628
  </details>
629
 
630
  ### Training Logs
631
- | Epoch | Step | Training Loss | Validation Loss | NanoMSMARCO_cosine_ndcg@10 | NanoNQ_cosine_ndcg@10 | NanoBEIR_mean_cosine_ndcg@10 |
632
- |:----------:|:-------:|:-------------:|:---------------:|:--------------------------:|:---------------------:|:----------------------------:|
633
- | 0 | 0 | - | 4.0678 | 0.6259 | 0.6583 | 0.6421 |
634
- | 0.2874 | 250 | 1.7031 | 0.8455 | 0.5349 | 0.5337 | 0.5343 |
635
- | **0.5747** | **500** | **0.949** | **0.8059** | **0.5292** | **0.5546** | **0.5419** |
636
- | 0.8621 | 750 | 0.9183 | 0.7856 | 0.5325 | 0.5433 | 0.5379 |
637
- | 1.1494 | 1000 | 0.8561 | 0.7834 | 0.5132 | 0.5408 | 0.5270 |
638
- | 1.4368 | 1250 | 0.8156 | 0.7782 | 0.5150 | 0.5353 | 0.5252 |
639
- | 1.7241 | 1500 | 0.8064 | 0.7715 | 0.5369 | 0.5407 | 0.5388 |
640
-
641
- * The bold row denotes the saved checkpoint.
 
 
 
 
 
 
 
 
 
 
 
 
 
642
 
643
  ### Framework Versions
644
  - Python: 3.10.18
 
7
  - generated_from_trainer
8
  - dataset_size:111470
9
  - loss:MultipleNegativesRankingLoss
10
+ base_model: sentence-transformers/all-MiniLM-L6-v2
11
  widget:
12
  - source_sentence: why are some rocks radioactive
13
  sentences:
 
106
  - cosine_mrr@10
107
  - cosine_map@100
108
  model-index:
109
+ - name: SentenceTransformer based on sentence-transformers/all-MiniLM-L6-v2
110
  results:
111
  - task:
112
  type: information-retrieval
 
116
  type: NanoMSMARCO
117
  metrics:
118
  - type: cosine_accuracy@1
119
+ value: 0.3
120
  name: Cosine Accuracy@1
121
  - type: cosine_accuracy@3
122
+ value: 0.5
123
  name: Cosine Accuracy@3
124
  - type: cosine_accuracy@5
125
+ value: 0.58
126
  name: Cosine Accuracy@5
127
  - type: cosine_accuracy@10
128
  value: 0.68
129
  name: Cosine Accuracy@10
130
  - type: cosine_precision@1
131
+ value: 0.3
132
  name: Cosine Precision@1
133
  - type: cosine_precision@3
134
+ value: 0.16666666666666669
135
  name: Cosine Precision@3
136
  - type: cosine_precision@5
137
+ value: 0.11599999999999999
138
  name: Cosine Precision@5
139
  - type: cosine_precision@10
140
  value: 0.068
141
  name: Cosine Precision@10
142
  - type: cosine_recall@1
143
+ value: 0.3
144
  name: Cosine Recall@1
145
  - type: cosine_recall@3
146
+ value: 0.5
147
  name: Cosine Recall@3
148
  - type: cosine_recall@5
149
+ value: 0.58
150
  name: Cosine Recall@5
151
  - type: cosine_recall@10
152
  value: 0.68
153
  name: Cosine Recall@10
154
  - type: cosine_ndcg@10
155
+ value: 0.48741389266955737
156
  name: Cosine Ndcg@10
157
  - type: cosine_mrr@10
158
+ value: 0.4262222222222222
159
  name: Cosine Mrr@10
160
  - type: cosine_map@100
161
+ value: 0.44072094685707097
162
  name: Cosine Map@100
163
  - task:
164
  type: information-retrieval
 
168
  type: NanoNQ
169
  metrics:
170
  - type: cosine_accuracy@1
171
+ value: 0.26
172
  name: Cosine Accuracy@1
173
  - type: cosine_accuracy@3
174
+ value: 0.4
175
  name: Cosine Accuracy@3
176
  - type: cosine_accuracy@5
177
+ value: 0.48
178
  name: Cosine Accuracy@5
179
  - type: cosine_accuracy@10
180
+ value: 0.54
181
  name: Cosine Accuracy@10
182
  - type: cosine_precision@1
183
+ value: 0.26
184
  name: Cosine Precision@1
185
  - type: cosine_precision@3
186
+ value: 0.14
187
  name: Cosine Precision@3
188
  - type: cosine_precision@5
189
+ value: 0.1
190
  name: Cosine Precision@5
191
  - type: cosine_precision@10
192
+ value: 0.05600000000000001
193
  name: Cosine Precision@10
194
  - type: cosine_recall@1
195
+ value: 0.23
196
  name: Cosine Recall@1
197
  - type: cosine_recall@3
198
+ value: 0.37
199
  name: Cosine Recall@3
200
  - type: cosine_recall@5
201
+ value: 0.45
202
  name: Cosine Recall@5
203
  - type: cosine_recall@10
204
+ value: 0.51
205
  name: Cosine Recall@10
206
  - type: cosine_ndcg@10
207
+ value: 0.3745207998751907
208
  name: Cosine Ndcg@10
209
  - type: cosine_mrr@10
210
+ value: 0.35074603174603175
211
  name: Cosine Mrr@10
212
  - type: cosine_map@100
213
+ value: 0.3364191132763434
214
  name: Cosine Map@100
215
  - task:
216
  type: nano-beir
 
220
  type: NanoBEIR_mean
221
  metrics:
222
  - type: cosine_accuracy@1
223
+ value: 0.28
224
  name: Cosine Accuracy@1
225
  - type: cosine_accuracy@3
226
+ value: 0.45
227
  name: Cosine Accuracy@3
228
  - type: cosine_accuracy@5
229
+ value: 0.53
230
  name: Cosine Accuracy@5
231
  - type: cosine_accuracy@10
232
+ value: 0.6100000000000001
233
  name: Cosine Accuracy@10
234
  - type: cosine_precision@1
235
+ value: 0.28
236
  name: Cosine Precision@1
237
  - type: cosine_precision@3
238
+ value: 0.15333333333333335
239
  name: Cosine Precision@3
240
  - type: cosine_precision@5
241
+ value: 0.108
242
  name: Cosine Precision@5
243
  - type: cosine_precision@10
244
+ value: 0.062000000000000006
245
  name: Cosine Precision@10
246
  - type: cosine_recall@1
247
+ value: 0.265
248
  name: Cosine Recall@1
249
  - type: cosine_recall@3
250
+ value: 0.435
251
  name: Cosine Recall@3
252
  - type: cosine_recall@5
253
+ value: 0.515
254
  name: Cosine Recall@5
255
  - type: cosine_recall@10
256
+ value: 0.595
257
  name: Cosine Recall@10
258
  - type: cosine_ndcg@10
259
+ value: 0.43096734627237404
260
  name: Cosine Ndcg@10
261
  - type: cosine_mrr@10
262
+ value: 0.388484126984127
263
  name: Cosine Mrr@10
264
  - type: cosine_map@100
265
+ value: 0.3885700300667072
266
  name: Cosine Map@100
267
  ---
268
 
269
+ # SentenceTransformer based on sentence-transformers/all-MiniLM-L6-v2
270
 
271
+ This is a [sentence-transformers](https://www.SBERT.net) model finetuned from [sentence-transformers/all-MiniLM-L6-v2](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2). It maps sentences & paragraphs to a 384-dimensional dense vector space and can be used for semantic textual similarity, semantic search, paraphrase mining, text classification, clustering, and more.
272
 
273
  ## Model Details
274
 
275
  ### Model Description
276
  - **Model Type:** Sentence Transformer
277
+ - **Base model:** [sentence-transformers/all-MiniLM-L6-v2](https://huggingface.co/sentence-transformers/all-MiniLM-L6-v2) <!-- at revision c9745ed1d9f207416be6d2e6f8de32d1f16199bf -->
278
  - **Maximum Sequence Length:** 128 tokens
279
  - **Output Dimensionality:** 384 dimensions
280
  - **Similarity Function:** Cosine Similarity
 
327
  # Get the similarity scores for the embeddings
328
  similarities = model.similarity(embeddings, embeddings)
329
  print(similarities)
330
+ # tensor([[1.0000, 1.0000, 0.9587],
331
+ # [1.0000, 1.0000, 0.9587],
332
+ # [0.9587, 0.9587, 1.0000]])
333
  ```
334
 
335
  <!--
 
367
 
368
  | Metric | NanoMSMARCO | NanoNQ |
369
  |:--------------------|:------------|:-----------|
370
+ | cosine_accuracy@1 | 0.3 | 0.26 |
371
+ | cosine_accuracy@3 | 0.5 | 0.4 |
372
+ | cosine_accuracy@5 | 0.58 | 0.48 |
373
+ | cosine_accuracy@10 | 0.68 | 0.54 |
374
+ | cosine_precision@1 | 0.3 | 0.26 |
375
+ | cosine_precision@3 | 0.1667 | 0.14 |
376
+ | cosine_precision@5 | 0.116 | 0.1 |
377
+ | cosine_precision@10 | 0.068 | 0.056 |
378
+ | cosine_recall@1 | 0.3 | 0.23 |
379
+ | cosine_recall@3 | 0.5 | 0.37 |
380
+ | cosine_recall@5 | 0.58 | 0.45 |
381
+ | cosine_recall@10 | 0.68 | 0.51 |
382
+ | **cosine_ndcg@10** | **0.4874** | **0.3745** |
383
+ | cosine_mrr@10 | 0.4262 | 0.3507 |
384
+ | cosine_map@100 | 0.4407 | 0.3364 |
385
 
386
  #### Nano BEIR
387
 
 
397
  }
398
  ```
399
 
400
+ | Metric | Value |
401
+ |:--------------------|:----------|
402
+ | cosine_accuracy@1 | 0.28 |
403
+ | cosine_accuracy@3 | 0.45 |
404
+ | cosine_accuracy@5 | 0.53 |
405
+ | cosine_accuracy@10 | 0.61 |
406
+ | cosine_precision@1 | 0.28 |
407
+ | cosine_precision@3 | 0.1533 |
408
+ | cosine_precision@5 | 0.108 |
409
+ | cosine_precision@10 | 0.062 |
410
+ | cosine_recall@1 | 0.265 |
411
+ | cosine_recall@3 | 0.435 |
412
+ | cosine_recall@5 | 0.515 |
413
+ | cosine_recall@10 | 0.595 |
414
+ | **cosine_ndcg@10** | **0.431** |
415
+ | cosine_mrr@10 | 0.3885 |
416
+ | cosine_map@100 | 0.3886 |
417
 
418
  <!--
419
  ## Bias, Risks and Limitations
 
487
  - `eval_strategy`: steps
488
  - `per_device_train_batch_size`: 128
489
  - `per_device_eval_batch_size`: 128
490
+ - `learning_rate`: 0.0001
491
+ - `weight_decay`: 0.001
492
+ - `max_steps`: 5062
493
  - `warmup_ratio`: 0.1
494
  - `fp16`: True
495
  - `dataloader_drop_last`: True
 
516
  - `gradient_accumulation_steps`: 1
517
  - `eval_accumulation_steps`: None
518
  - `torch_empty_cache_steps`: None
519
+ - `learning_rate`: 0.0001
520
+ - `weight_decay`: 0.001
521
  - `adam_beta1`: 0.9
522
  - `adam_beta2`: 0.999
523
  - `adam_epsilon`: 1e-08
524
  - `max_grad_norm`: 1.0
525
  - `num_train_epochs`: 3.0
526
+ - `max_steps`: 5062
527
  - `lr_scheduler_type`: linear
528
  - `lr_scheduler_kwargs`: {}
529
  - `warmup_ratio`: 0.1
 
628
  </details>
629
 
630
  ### Training Logs
631
+ | Epoch | Step | Training Loss | Validation Loss | NanoMSMARCO_cosine_ndcg@10 | NanoNQ_cosine_ndcg@10 | NanoBEIR_mean_cosine_ndcg@10 |
632
+ |:------:|:----:|:-------------:|:---------------:|:--------------------------:|:---------------------:|:----------------------------:|
633
+ | 0 | 0 | - | 1.1445 | 0.5540 | 0.5931 | 0.5735 |
634
+ | 0.2874 | 250 | 1.1025 | 0.8649 | 0.4839 | 0.5173 | 0.5006 |
635
+ | 0.5747 | 500 | 0.9965 | 0.8468 | 0.5015 | 0.4853 | 0.4934 |
636
+ | 0.8621 | 750 | 0.9723 | 0.8249 | 0.5063 | 0.4415 | 0.4739 |
637
+ | 1.1494 | 1000 | 0.9091 | 0.8153 | 0.4996 | 0.4265 | 0.4630 |
638
+ | 1.4368 | 1250 | 0.868 | 0.8118 | 0.5418 | 0.4201 | 0.4809 |
639
+ | 1.7241 | 1500 | 0.863 | 0.8032 | 0.5073 | 0.4010 | 0.4542 |
640
+ | 2.0115 | 1750 | 0.8557 | 0.8096 | 0.5121 | 0.3922 | 0.4521 |
641
+ | 2.2989 | 2000 | 0.7687 | 0.8067 | 0.4885 | 0.3905 | 0.4395 |
642
+ | 2.5862 | 2250 | 0.7718 | 0.8011 | 0.4848 | 0.3960 | 0.4404 |
643
+ | 2.8736 | 2500 | 0.7648 | 0.8022 | 0.4765 | 0.4119 | 0.4442 |
644
+ | 3.1609 | 2750 | 0.7339 | 0.8176 | 0.4813 | 0.3885 | 0.4349 |
645
+ | 3.4483 | 3000 | 0.7055 | 0.8101 | 0.4753 | 0.3991 | 0.4372 |
646
+ | 3.7356 | 3250 | 0.7065 | 0.8195 | 0.5022 | 0.3715 | 0.4368 |
647
+ | 4.0230 | 3500 | 0.7014 | 0.8258 | 0.5272 | 0.3856 | 0.4564 |
648
+ | 4.3103 | 3750 | 0.6601 | 0.8191 | 0.4957 | 0.3766 | 0.4361 |
649
+ | 4.5977 | 4000 | 0.6632 | 0.8264 | 0.4649 | 0.3741 | 0.4195 |
650
+ | 4.8851 | 4250 | 0.664 | 0.8191 | 0.4954 | 0.3662 | 0.4308 |
651
+ | 5.1724 | 4500 | 0.6422 | 0.8277 | 0.4851 | 0.3749 | 0.4300 |
652
+ | 5.4598 | 4750 | 0.6336 | 0.8296 | 0.4855 | 0.3725 | 0.4290 |
653
+ | 5.7471 | 5000 | 0.6316 | 0.8279 | 0.4874 | 0.3745 | 0.4310 |
654
+
655
 
656
  ### Framework Versions
657
  - Python: 3.10.18
config_sentence_transformers.json CHANGED
@@ -1,10 +1,10 @@
1
  {
2
- "model_type": "SentenceTransformer",
3
  "__version__": {
4
  "sentence_transformers": "5.2.0",
5
  "transformers": "4.57.3",
6
  "pytorch": "2.9.1+cu128"
7
  },
 
8
  "prompts": {
9
  "query": "",
10
  "document": ""
 
1
  {
 
2
  "__version__": {
3
  "sentence_transformers": "5.2.0",
4
  "transformers": "4.57.3",
5
  "pytorch": "2.9.1+cu128"
6
  },
7
+ "model_type": "SentenceTransformer",
8
  "prompts": {
9
  "query": "",
10
  "document": ""