Update README.md
Browse files
README.md
CHANGED
|
@@ -27,7 +27,7 @@ model-index:
|
|
| 27 |
type: mteb/amazon_counterfactual
|
| 28 |
metrics:
|
| 29 |
- type: accuracy
|
| 30 |
-
value:
|
| 31 |
task:
|
| 32 |
type: Classification
|
| 33 |
- dataset:
|
|
@@ -38,7 +38,7 @@ model-index:
|
|
| 38 |
type: mteb/amazon_counterfactual
|
| 39 |
metrics:
|
| 40 |
- type: accuracy
|
| 41 |
-
value:
|
| 42 |
task:
|
| 43 |
type: Classification
|
| 44 |
- dataset:
|
|
@@ -49,7 +49,7 @@ model-index:
|
|
| 49 |
type: mteb/amazon_reviews_multi
|
| 50 |
metrics:
|
| 51 |
- type: accuracy
|
| 52 |
-
value:
|
| 53 |
task:
|
| 54 |
type: Classification
|
| 55 |
- dataset:
|
|
@@ -60,7 +60,7 @@ model-index:
|
|
| 60 |
type: mteb/amazon_reviews_multi
|
| 61 |
metrics:
|
| 62 |
- type: accuracy
|
| 63 |
-
value:
|
| 64 |
task:
|
| 65 |
type: Classification
|
| 66 |
- dataset:
|
|
@@ -71,7 +71,7 @@ model-index:
|
|
| 71 |
type: slvnwhrl/blurbs-clustering-p2p
|
| 72 |
metrics:
|
| 73 |
- type: v_measure
|
| 74 |
-
value:
|
| 75 |
task:
|
| 76 |
type: Clustering
|
| 77 |
- dataset:
|
|
@@ -82,7 +82,7 @@ model-index:
|
|
| 82 |
type: slvnwhrl/blurbs-clustering-s2s
|
| 83 |
metrics:
|
| 84 |
- type: v_measure
|
| 85 |
-
value:
|
| 86 |
task:
|
| 87 |
type: Clustering
|
| 88 |
- dataset:
|
|
@@ -93,7 +93,7 @@ model-index:
|
|
| 93 |
type: deepset/germandpr
|
| 94 |
metrics:
|
| 95 |
- type: ndcg_at_10
|
| 96 |
-
value:
|
| 97 |
task:
|
| 98 |
type: Retrieval
|
| 99 |
- dataset:
|
|
@@ -104,7 +104,7 @@ model-index:
|
|
| 104 |
type: mteb/germanquad-retrieval
|
| 105 |
metrics:
|
| 106 |
- type: mrr_at_5
|
| 107 |
-
value:
|
| 108 |
task:
|
| 109 |
type: Retrieval
|
| 110 |
- dataset:
|
|
@@ -115,7 +115,7 @@ model-index:
|
|
| 115 |
type: jinaai/german-STSbenchmark
|
| 116 |
metrics:
|
| 117 |
- type: cos_sim_spearman
|
| 118 |
-
value:
|
| 119 |
task:
|
| 120 |
type: STS
|
| 121 |
- dataset:
|
|
@@ -126,7 +126,7 @@ model-index:
|
|
| 126 |
type: jinaai/german-STSbenchmark
|
| 127 |
metrics:
|
| 128 |
- type: cos_sim_spearman
|
| 129 |
-
value:
|
| 130 |
task:
|
| 131 |
type: STS
|
| 132 |
- dataset:
|
|
@@ -137,7 +137,7 @@ model-index:
|
|
| 137 |
type: mteb/amazon_massive_intent
|
| 138 |
metrics:
|
| 139 |
- type: accuracy
|
| 140 |
-
value:
|
| 141 |
task:
|
| 142 |
type: Classification
|
| 143 |
- dataset:
|
|
@@ -148,7 +148,7 @@ model-index:
|
|
| 148 |
type: mteb/amazon_massive_intent
|
| 149 |
metrics:
|
| 150 |
- type: accuracy
|
| 151 |
-
value:
|
| 152 |
task:
|
| 153 |
type: Classification
|
| 154 |
- dataset:
|
|
@@ -159,7 +159,7 @@ model-index:
|
|
| 159 |
type: mteb/amazon_massive_scenario
|
| 160 |
metrics:
|
| 161 |
- type: accuracy
|
| 162 |
-
value:
|
| 163 |
task:
|
| 164 |
type: Classification
|
| 165 |
- dataset:
|
|
@@ -170,7 +170,7 @@ model-index:
|
|
| 170 |
type: mteb/amazon_massive_scenario
|
| 171 |
metrics:
|
| 172 |
- type: accuracy
|
| 173 |
-
value:
|
| 174 |
task:
|
| 175 |
type: Classification
|
| 176 |
- dataset:
|
|
@@ -181,7 +181,7 @@ model-index:
|
|
| 181 |
type: mteb/mtop_domain
|
| 182 |
metrics:
|
| 183 |
- type: accuracy
|
| 184 |
-
value:
|
| 185 |
task:
|
| 186 |
type: Classification
|
| 187 |
- dataset:
|
|
@@ -192,7 +192,7 @@ model-index:
|
|
| 192 |
type: mteb/mtop_domain
|
| 193 |
metrics:
|
| 194 |
- type: accuracy
|
| 195 |
-
value:
|
| 196 |
task:
|
| 197 |
type: Classification
|
| 198 |
- dataset:
|
|
@@ -203,7 +203,7 @@ model-index:
|
|
| 203 |
type: mteb/mtop_intent
|
| 204 |
metrics:
|
| 205 |
- type: accuracy
|
| 206 |
-
value:
|
| 207 |
task:
|
| 208 |
type: Classification
|
| 209 |
- dataset:
|
|
@@ -214,7 +214,7 @@ model-index:
|
|
| 214 |
type: mteb/mtop_intent
|
| 215 |
metrics:
|
| 216 |
- type: accuracy
|
| 217 |
-
value:
|
| 218 |
task:
|
| 219 |
type: Classification
|
| 220 |
- dataset:
|
|
@@ -225,7 +225,7 @@ model-index:
|
|
| 225 |
type: google-research-datasets/paws-x
|
| 226 |
metrics:
|
| 227 |
- type: ap
|
| 228 |
-
value:
|
| 229 |
task:
|
| 230 |
type: PairClassification
|
| 231 |
- dataset:
|
|
@@ -236,7 +236,7 @@ model-index:
|
|
| 236 |
type: google-research-datasets/paws-x
|
| 237 |
metrics:
|
| 238 |
- type: ap
|
| 239 |
-
value:
|
| 240 |
task:
|
| 241 |
type: PairClassification
|
| 242 |
- dataset:
|
|
@@ -247,7 +247,7 @@ model-index:
|
|
| 247 |
type: mteb/sts22-crosslingual-sts
|
| 248 |
metrics:
|
| 249 |
- type: cos_sim_spearman
|
| 250 |
-
value:
|
| 251 |
task:
|
| 252 |
type: STS
|
| 253 |
- dataset:
|
|
@@ -258,7 +258,7 @@ model-index:
|
|
| 258 |
type: slvnwhrl/tenkgnad-clustering-p2p
|
| 259 |
metrics:
|
| 260 |
- type: v_measure
|
| 261 |
-
value:
|
| 262 |
task:
|
| 263 |
type: Clustering
|
| 264 |
- dataset:
|
|
@@ -269,7 +269,7 @@ model-index:
|
|
| 269 |
type: slvnwhrl/tenkgnad-clustering-s2s
|
| 270 |
metrics:
|
| 271 |
- type: v_measure
|
| 272 |
-
value:
|
| 273 |
task:
|
| 274 |
type: Clustering
|
| 275 |
- dataset:
|
|
@@ -280,7 +280,7 @@ model-index:
|
|
| 280 |
type: aari1995/false_friends_de_en_mteb
|
| 281 |
metrics:
|
| 282 |
- type: ap
|
| 283 |
-
value:
|
| 284 |
task:
|
| 285 |
type: PairClassification
|
| 286 |
- dataset:
|
|
@@ -291,7 +291,7 @@ model-index:
|
|
| 291 |
type: jinaai/german-STSbenchmark
|
| 292 |
metrics:
|
| 293 |
- type: cos_sim_spearman
|
| 294 |
-
value:
|
| 295 |
task:
|
| 296 |
type: STS
|
| 297 |
- dataset:
|
|
@@ -302,7 +302,7 @@ model-index:
|
|
| 302 |
type: jinaai/german-STSbenchmark
|
| 303 |
metrics:
|
| 304 |
- type: cos_sim_spearman
|
| 305 |
-
value:
|
| 306 |
task:
|
| 307 |
type: STS
|
| 308 |
---
|
|
|
|
| 27 |
type: mteb/amazon_counterfactual
|
| 28 |
metrics:
|
| 29 |
- type: accuracy
|
| 30 |
+
value: 67.00214132762312
|
| 31 |
task:
|
| 32 |
type: Classification
|
| 33 |
- dataset:
|
|
|
|
| 38 |
type: mteb/amazon_counterfactual
|
| 39 |
metrics:
|
| 40 |
- type: accuracy
|
| 41 |
+
value: 68.43347639484978
|
| 42 |
task:
|
| 43 |
type: Classification
|
| 44 |
- dataset:
|
|
|
|
| 49 |
type: mteb/amazon_reviews_multi
|
| 50 |
metrics:
|
| 51 |
- type: accuracy
|
| 52 |
+
value: 39.092
|
| 53 |
task:
|
| 54 |
type: Classification
|
| 55 |
- dataset:
|
|
|
|
| 60 |
type: mteb/amazon_reviews_multi
|
| 61 |
metrics:
|
| 62 |
- type: accuracy
|
| 63 |
+
value: 39.146000000000003
|
| 64 |
task:
|
| 65 |
type: Classification
|
| 66 |
- dataset:
|
|
|
|
| 71 |
type: slvnwhrl/blurbs-clustering-p2p
|
| 72 |
metrics:
|
| 73 |
- type: v_measure
|
| 74 |
+
value: 38.680981669842135
|
| 75 |
task:
|
| 76 |
type: Clustering
|
| 77 |
- dataset:
|
|
|
|
| 82 |
type: slvnwhrl/blurbs-clustering-s2s
|
| 83 |
metrics:
|
| 84 |
- type: v_measure
|
| 85 |
+
value: 17.624489937027504
|
| 86 |
task:
|
| 87 |
type: Clustering
|
| 88 |
- dataset:
|
|
|
|
| 93 |
type: deepset/germandpr
|
| 94 |
metrics:
|
| 95 |
- type: ndcg_at_10
|
| 96 |
+
value: 72.921
|
| 97 |
task:
|
| 98 |
type: Retrieval
|
| 99 |
- dataset:
|
|
|
|
| 104 |
type: mteb/germanquad-retrieval
|
| 105 |
metrics:
|
| 106 |
- type: mrr_at_5
|
| 107 |
+
value: 85.316
|
| 108 |
task:
|
| 109 |
type: Retrieval
|
| 110 |
- dataset:
|
|
|
|
| 115 |
type: jinaai/german-STSbenchmark
|
| 116 |
metrics:
|
| 117 |
- type: cos_sim_spearman
|
| 118 |
+
value: 84.67696933608695
|
| 119 |
task:
|
| 120 |
type: STS
|
| 121 |
- dataset:
|
|
|
|
| 126 |
type: jinaai/german-STSbenchmark
|
| 127 |
metrics:
|
| 128 |
- type: cos_sim_spearman
|
| 129 |
+
value: 88.048957974805
|
| 130 |
task:
|
| 131 |
type: STS
|
| 132 |
- dataset:
|
|
|
|
| 137 |
type: mteb/amazon_massive_intent
|
| 138 |
metrics:
|
| 139 |
- type: accuracy
|
| 140 |
+
value: 66.25084061869536
|
| 141 |
task:
|
| 142 |
type: Classification
|
| 143 |
- dataset:
|
|
|
|
| 148 |
type: mteb/amazon_massive_intent
|
| 149 |
metrics:
|
| 150 |
- type: accuracy
|
| 151 |
+
value: 66.44859813084113
|
| 152 |
task:
|
| 153 |
type: Classification
|
| 154 |
- dataset:
|
|
|
|
| 159 |
type: mteb/amazon_massive_scenario
|
| 160 |
metrics:
|
| 161 |
- type: accuracy
|
| 162 |
+
value: 72.51176866173503
|
| 163 |
task:
|
| 164 |
type: Classification
|
| 165 |
- dataset:
|
|
|
|
| 170 |
type: mteb/amazon_massive_scenario
|
| 171 |
metrics:
|
| 172 |
- type: accuracy
|
| 173 |
+
value: 72.02164289227742
|
| 174 |
task:
|
| 175 |
type: Classification
|
| 176 |
- dataset:
|
|
|
|
| 181 |
type: mteb/mtop_domain
|
| 182 |
metrics:
|
| 183 |
- type: accuracy
|
| 184 |
+
value: 89.00253592561285
|
| 185 |
task:
|
| 186 |
type: Classification
|
| 187 |
- dataset:
|
|
|
|
| 192 |
type: mteb/mtop_domain
|
| 193 |
metrics:
|
| 194 |
- type: accuracy
|
| 195 |
+
value: 87.70798898071626
|
| 196 |
task:
|
| 197 |
type: Classification
|
| 198 |
- dataset:
|
|
|
|
| 203 |
type: mteb/mtop_intent
|
| 204 |
metrics:
|
| 205 |
- type: accuracy
|
| 206 |
+
value: 70.06198929275853
|
| 207 |
task:
|
| 208 |
type: Classification
|
| 209 |
- dataset:
|
|
|
|
| 214 |
type: mteb/mtop_intent
|
| 215 |
metrics:
|
| 216 |
- type: accuracy
|
| 217 |
+
value: 68.6060606060606
|
| 218 |
task:
|
| 219 |
type: Classification
|
| 220 |
- dataset:
|
|
|
|
| 225 |
type: google-research-datasets/paws-x
|
| 226 |
metrics:
|
| 227 |
- type: ap
|
| 228 |
+
value: 57.47670853851811
|
| 229 |
task:
|
| 230 |
type: PairClassification
|
| 231 |
- dataset:
|
|
|
|
| 236 |
type: google-research-datasets/paws-x
|
| 237 |
metrics:
|
| 238 |
- type: ap
|
| 239 |
+
value: 52.85587710877178
|
| 240 |
task:
|
| 241 |
type: PairClassification
|
| 242 |
- dataset:
|
|
|
|
| 247 |
type: mteb/sts22-crosslingual-sts
|
| 248 |
metrics:
|
| 249 |
- type: cos_sim_spearman
|
| 250 |
+
value: 50.63839763951755
|
| 251 |
task:
|
| 252 |
type: STS
|
| 253 |
- dataset:
|
|
|
|
| 258 |
type: slvnwhrl/tenkgnad-clustering-p2p
|
| 259 |
metrics:
|
| 260 |
- type: v_measure
|
| 261 |
+
value: 37.996685796529817
|
| 262 |
task:
|
| 263 |
type: Clustering
|
| 264 |
- dataset:
|
|
|
|
| 269 |
type: slvnwhrl/tenkgnad-clustering-s2s
|
| 270 |
metrics:
|
| 271 |
- type: v_measure
|
| 272 |
+
value: 23.71145428041516
|
| 273 |
task:
|
| 274 |
type: Clustering
|
| 275 |
- dataset:
|
|
|
|
| 280 |
type: aari1995/false_friends_de_en_mteb
|
| 281 |
metrics:
|
| 282 |
- type: ap
|
| 283 |
+
value: 71.22096746794873
|
| 284 |
task:
|
| 285 |
type: PairClassification
|
| 286 |
- dataset:
|
|
|
|
| 291 |
type: jinaai/german-STSbenchmark
|
| 292 |
metrics:
|
| 293 |
- type: cos_sim_spearman
|
| 294 |
+
value: 84.67698604065061
|
| 295 |
task:
|
| 296 |
type: STS
|
| 297 |
- dataset:
|
|
|
|
| 302 |
type: jinaai/german-STSbenchmark
|
| 303 |
metrics:
|
| 304 |
- type: cos_sim_spearman
|
| 305 |
+
value: 88.048957974805
|
| 306 |
task:
|
| 307 |
type: STS
|
| 308 |
---
|