Add evaluation results for model mteb/bm25s revision 0_1_10
#4
by
Samoed - opened
This view is limited to 50 files because it contains too many changes.
See the raw diff here.
- .eval_results/AILACasedocs.yaml +12 -0
- .eval_results/AILAStatutes.yaml +12 -0
- .eval_results/AppsRetrieval.yaml +12 -0
- .eval_results/ArguAna.yaml +12 -0
- .eval_results/CQADupstackAndroidRetrieval.yaml +12 -0
- .eval_results/CQADupstackEnglishRetrieval.yaml +12 -0
- .eval_results/CQADupstackGamingRetrieval.yaml +12 -0
- .eval_results/CQADupstackGisRetrieval.yaml +12 -0
- .eval_results/CQADupstackMathematicaRetrieval.yaml +12 -0
- .eval_results/CQADupstackPhysicsRetrieval.yaml +12 -0
- .eval_results/CQADupstackProgrammersRetrieval.yaml +12 -0
- .eval_results/CQADupstackRetrieval.yaml +12 -0
- .eval_results/CQADupstackStatsRetrieval.yaml +12 -0
- .eval_results/CQADupstackTexRetrieval.yaml +12 -0
- .eval_results/CQADupstackUnixRetrieval.yaml +12 -0
- .eval_results/CQADupstackWebmastersRetrieval.yaml +12 -0
- .eval_results/CQADupstackWordpressRetrieval.yaml +12 -0
- .eval_results/CUREv1.yaml +204 -0
- .eval_results/ChatDoctorRetrieval.yaml +12 -0
- .eval_results/ClimateFEVER.yaml +12 -0
- .eval_results/CmedqaRetrieval.yaml +12 -0
- .eval_results/Code1Retrieval.yaml +12 -0
- .eval_results/DBPedia.yaml +12 -0
- .eval_results/DS1000Retrieval.yaml +12 -0
- .eval_results/EnglishFinance1Retrieval.yaml +12 -0
- .eval_results/EnglishFinance2Retrieval.yaml +12 -0
- .eval_results/EnglishFinance3Retrieval.yaml +12 -0
- .eval_results/EnglishFinance4Retrieval.yaml +12 -0
- .eval_results/EnglishHealthcare1Retrieval.yaml +12 -0
- .eval_results/FEVER.yaml +18 -0
- .eval_results/FiQA2018.yaml +18 -0
- .eval_results/FinQARetrieval.yaml +12 -0
- .eval_results/FinanceBenchRetrieval.yaml +12 -0
- .eval_results/French1Retrieval.yaml +12 -0
- .eval_results/FrenchLegal1Retrieval.yaml +12 -0
- .eval_results/FreshStackRetrieval.yaml +12 -0
- .eval_results/German1Retrieval.yaml +12 -0
- .eval_results/GermanHealthcare1Retrieval.yaml +12 -0
- .eval_results/GermanLegal1Retrieval.yaml +12 -0
- .eval_results/HC3FinanceRetrieval.yaml +12 -0
- .eval_results/HotpotQA.yaml +18 -0
- .eval_results/HumanEvalRetrieval.yaml +12 -0
- .eval_results/JaCWIRRetrieval.yaml +12 -0
- .eval_results/JaGovFaqsRetrieval.yaml +12 -0
- .eval_results/JapaneseCode1Retrieval.yaml +12 -0
- .eval_results/JapaneseLegal1Retrieval.yaml +12 -0
- .eval_results/JaqketRetrieval.yaml +12 -0
- .eval_results/LegalQuAD.yaml +12 -0
- .eval_results/LegalSummarization.yaml +12 -0
- .eval_results/MBPPRetrieval.yaml +12 -0
.eval_results/AILACasedocs.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/AILA_casedocs
|
| 3 |
+
revision: 4106e6bcc72e0698d714ea8b101355e3e238431a
|
| 4 |
+
task_id: AILACasedocs_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.27837
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/AILA_casedocs
|
| 9 |
+
revision: 4106e6bcc72e0698d714ea8b101355e3e238431a
|
| 10 |
+
task_id: AILACasedocs
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.27837
|
.eval_results/AILAStatutes.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/AILA_statutes
|
| 3 |
+
revision: ebfcd844eadd3d667efa3c57fc5c8c87f5c2867e
|
| 4 |
+
task_id: AILAStatutes_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.21618
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/AILA_statutes
|
| 9 |
+
revision: ebfcd844eadd3d667efa3c57fc5c8c87f5c2867e
|
| 10 |
+
task_id: AILAStatutes
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.21618
|
.eval_results/AppsRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: CoIR-Retrieval/apps
|
| 3 |
+
revision: f22508f96b7a36c2415181ed8bb76f76e04ae2d5
|
| 4 |
+
task_id: AppsRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.04764
|
| 7 |
+
- dataset:
|
| 8 |
+
id: CoIR-Retrieval/apps
|
| 9 |
+
revision: f22508f96b7a36c2415181ed8bb76f76e04ae2d5
|
| 10 |
+
task_id: AppsRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.04764
|
.eval_results/ArguAna.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/arguana
|
| 3 |
+
revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
|
| 4 |
+
task_id: ArguAna_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.49276
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/arguana
|
| 9 |
+
revision: c22ab2a51041ffd869aaddef7af8d8215647e41a
|
| 10 |
+
task_id: ArguAna
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.49276
|
.eval_results/CQADupstackAndroidRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/CQADupstackAndroidRetrieval
|
| 3 |
+
revision: 9be4c0e46342e8e3aff577a89b9a1ec9bc6b4af3
|
| 4 |
+
task_id: CQADupstackAndroidRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.39693
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/CQADupstackAndroidRetrieval
|
| 9 |
+
revision: 9be4c0e46342e8e3aff577a89b9a1ec9bc6b4af3
|
| 10 |
+
task_id: CQADupstackAndroidRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.39693
|
.eval_results/CQADupstackEnglishRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-english
|
| 3 |
+
revision: ad9991cb51e31e31e430383c75ffb2885547b5f0
|
| 4 |
+
task_id: CQADupstackEnglishRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.34746
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-english
|
| 9 |
+
revision: ad9991cb51e31e31e430383c75ffb2885547b5f0
|
| 10 |
+
task_id: CQADupstackEnglishRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.34746
|
.eval_results/CQADupstackGamingRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-gaming
|
| 3 |
+
revision: 4885aa143210c98657558c04aaf3dc47cfb54340
|
| 4 |
+
task_id: CQADupstackGamingRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.48471
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-gaming
|
| 9 |
+
revision: 4885aa143210c98657558c04aaf3dc47cfb54340
|
| 10 |
+
task_id: CQADupstackGamingRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.48471
|
.eval_results/CQADupstackGisRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-gis
|
| 3 |
+
revision: 5003b3064772da1887988e05400cf3806fe491f2
|
| 4 |
+
task_id: CQADupstackGisRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.3083
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-gis
|
| 9 |
+
revision: 5003b3064772da1887988e05400cf3806fe491f2
|
| 10 |
+
task_id: CQADupstackGisRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.3083
|
.eval_results/CQADupstackMathematicaRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-mathematica
|
| 3 |
+
revision: 90fceea13679c63fe563ded68f3b6f06e50061de
|
| 4 |
+
task_id: CQADupstackMathematicaRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.22017
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-mathematica
|
| 9 |
+
revision: 90fceea13679c63fe563ded68f3b6f06e50061de
|
| 10 |
+
task_id: CQADupstackMathematicaRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.22017
|
.eval_results/CQADupstackPhysicsRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-physics
|
| 3 |
+
revision: 79531abbd1fb92d06c6d6315a0cbbbf5bb247ea4
|
| 4 |
+
task_id: CQADupstackPhysicsRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.34926
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-physics
|
| 9 |
+
revision: 79531abbd1fb92d06c6d6315a0cbbbf5bb247ea4
|
| 10 |
+
task_id: CQADupstackPhysicsRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.34926
|
.eval_results/CQADupstackProgrammersRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-programmers
|
| 3 |
+
revision: 6184bc1440d2dbc7612be22b50686b8826d22b32
|
| 4 |
+
task_id: CQADupstackProgrammersRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.298
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-programmers
|
| 9 |
+
revision: 6184bc1440d2dbc7612be22b50686b8826d22b32
|
| 10 |
+
task_id: CQADupstackProgrammersRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.298
|
.eval_results/CQADupstackRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: aggregate tasks do not have a path
|
| 3 |
+
revision: '1'
|
| 4 |
+
task_id: CQADupstackRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.318642
|
| 7 |
+
- dataset:
|
| 8 |
+
id: aggregate tasks do not have a path
|
| 9 |
+
revision: '1'
|
| 10 |
+
task_id: CQADupstackRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.318642
|
.eval_results/CQADupstackStatsRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-stats
|
| 3 |
+
revision: 65ac3a16b8e91f9cee4c9828cc7c335575432a2a
|
| 4 |
+
task_id: CQADupstackStatsRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.29019
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-stats
|
| 9 |
+
revision: 65ac3a16b8e91f9cee4c9828cc7c335575432a2a
|
| 10 |
+
task_id: CQADupstackStatsRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.29019
|
.eval_results/CQADupstackTexRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-tex
|
| 3 |
+
revision: 46989137a86843e03a6195de44b09deda022eec7
|
| 4 |
+
task_id: CQADupstackTexRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.24397
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-tex
|
| 9 |
+
revision: 46989137a86843e03a6195de44b09deda022eec7
|
| 10 |
+
task_id: CQADupstackTexRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.24397
|
.eval_results/CQADupstackUnixRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-unix
|
| 3 |
+
revision: 6c6430d3a6d36f8d2a829195bc5dc94d7e063e53
|
| 4 |
+
task_id: CQADupstackUnixRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.29165
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-unix
|
| 9 |
+
revision: 6c6430d3a6d36f8d2a829195bc5dc94d7e063e53
|
| 10 |
+
task_id: CQADupstackUnixRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.29165
|
.eval_results/CQADupstackWebmastersRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-webmasters
|
| 3 |
+
revision: 160c094312a0e1facb97e55eeddb698c0abe3571
|
| 4 |
+
task_id: CQADupstackWebmastersRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.31381
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-webmasters
|
| 9 |
+
revision: 160c094312a0e1facb97e55eeddb698c0abe3571
|
| 10 |
+
task_id: CQADupstackWebmastersRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.31381
|
.eval_results/CQADupstackWordpressRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/cqadupstack-wordpress
|
| 3 |
+
revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
|
| 4 |
+
task_id: CQADupstackWordpressRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.27925
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/cqadupstack-wordpress
|
| 9 |
+
revision: 4ffe81d471b1924886b33c7567bfb200e9eec5c4
|
| 10 |
+
task_id: CQADupstackWordpressRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.27925
|
.eval_results/CUREv1.yaml
ADDED
|
@@ -0,0 +1,204 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: clinia/CUREv1
|
| 3 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 4 |
+
task_id: CUREv1_en_all
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.35481
|
| 7 |
+
- dataset:
|
| 8 |
+
id: clinia/CUREv1
|
| 9 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 10 |
+
task_id: CUREv1_es_all
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.01157
|
| 13 |
+
- dataset:
|
| 14 |
+
id: clinia/CUREv1
|
| 15 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 16 |
+
task_id: CUREv1_fr_all
|
| 17 |
+
notes: Created by mteb
|
| 18 |
+
value: 0.01796
|
| 19 |
+
- dataset:
|
| 20 |
+
id: clinia/CUREv1
|
| 21 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 22 |
+
task_id: CUREv1_en_dentistry_and_oral_health
|
| 23 |
+
notes: Created by mteb
|
| 24 |
+
value: 0.38853
|
| 25 |
+
- dataset:
|
| 26 |
+
id: clinia/CUREv1
|
| 27 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 28 |
+
task_id: CUREv1_es_dentistry_and_oral_health
|
| 29 |
+
notes: Created by mteb
|
| 30 |
+
value: 0.00791
|
| 31 |
+
- dataset:
|
| 32 |
+
id: clinia/CUREv1
|
| 33 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 34 |
+
task_id: CUREv1_fr_dentistry_and_oral_health
|
| 35 |
+
notes: Created by mteb
|
| 36 |
+
value: 0.0137
|
| 37 |
+
- dataset:
|
| 38 |
+
id: clinia/CUREv1
|
| 39 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 40 |
+
task_id: CUREv1_en_dermatology
|
| 41 |
+
notes: Created by mteb
|
| 42 |
+
value: 0.40305
|
| 43 |
+
- dataset:
|
| 44 |
+
id: clinia/CUREv1
|
| 45 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 46 |
+
task_id: CUREv1_es_dermatology
|
| 47 |
+
notes: Created by mteb
|
| 48 |
+
value: 0.04687
|
| 49 |
+
- dataset:
|
| 50 |
+
id: clinia/CUREv1
|
| 51 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 52 |
+
task_id: CUREv1_fr_dermatology
|
| 53 |
+
notes: Created by mteb
|
| 54 |
+
value: 0.07281
|
| 55 |
+
- dataset:
|
| 56 |
+
id: clinia/CUREv1
|
| 57 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 58 |
+
task_id: CUREv1_en_gastroenterology
|
| 59 |
+
notes: Created by mteb
|
| 60 |
+
value: 0.30019
|
| 61 |
+
- dataset:
|
| 62 |
+
id: clinia/CUREv1
|
| 63 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 64 |
+
task_id: CUREv1_es_gastroenterology
|
| 65 |
+
notes: Created by mteb
|
| 66 |
+
value: 0.01412
|
| 67 |
+
- dataset:
|
| 68 |
+
id: clinia/CUREv1
|
| 69 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 70 |
+
task_id: CUREv1_fr_gastroenterology
|
| 71 |
+
notes: Created by mteb
|
| 72 |
+
value: 0.02969
|
| 73 |
+
- dataset:
|
| 74 |
+
id: clinia/CUREv1
|
| 75 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 76 |
+
task_id: CUREv1_en_genetics
|
| 77 |
+
notes: Created by mteb
|
| 78 |
+
value: 0.41022
|
| 79 |
+
- dataset:
|
| 80 |
+
id: clinia/CUREv1
|
| 81 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 82 |
+
task_id: CUREv1_es_genetics
|
| 83 |
+
notes: Created by mteb
|
| 84 |
+
value: 0.03798
|
| 85 |
+
- dataset:
|
| 86 |
+
id: clinia/CUREv1
|
| 87 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 88 |
+
task_id: CUREv1_fr_genetics
|
| 89 |
+
notes: Created by mteb
|
| 90 |
+
value: 0.08926
|
| 91 |
+
- dataset:
|
| 92 |
+
id: clinia/CUREv1
|
| 93 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 94 |
+
task_id: CUREv1_en_neuroscience_and_neurology
|
| 95 |
+
notes: Created by mteb
|
| 96 |
+
value: 0.31575
|
| 97 |
+
- dataset:
|
| 98 |
+
id: clinia/CUREv1
|
| 99 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 100 |
+
task_id: CUREv1_es_neuroscience_and_neurology
|
| 101 |
+
notes: Created by mteb
|
| 102 |
+
value: 0.00768
|
| 103 |
+
- dataset:
|
| 104 |
+
id: clinia/CUREv1
|
| 105 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 106 |
+
task_id: CUREv1_fr_neuroscience_and_neurology
|
| 107 |
+
notes: Created by mteb
|
| 108 |
+
value: 0.02533
|
| 109 |
+
- dataset:
|
| 110 |
+
id: clinia/CUREv1
|
| 111 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 112 |
+
task_id: CUREv1_en_orthopedic_surgery
|
| 113 |
+
notes: Created by mteb
|
| 114 |
+
value: 0.39297
|
| 115 |
+
- dataset:
|
| 116 |
+
id: clinia/CUREv1
|
| 117 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 118 |
+
task_id: CUREv1_es_orthopedic_surgery
|
| 119 |
+
notes: Created by mteb
|
| 120 |
+
value: 0.02131
|
| 121 |
+
- dataset:
|
| 122 |
+
id: clinia/CUREv1
|
| 123 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 124 |
+
task_id: CUREv1_fr_orthopedic_surgery
|
| 125 |
+
notes: Created by mteb
|
| 126 |
+
value: 0.04247
|
| 127 |
+
- dataset:
|
| 128 |
+
id: clinia/CUREv1
|
| 129 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 130 |
+
task_id: CUREv1_en_otorhinolaryngology
|
| 131 |
+
notes: Created by mteb
|
| 132 |
+
value: 0.33081
|
| 133 |
+
- dataset:
|
| 134 |
+
id: clinia/CUREv1
|
| 135 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 136 |
+
task_id: CUREv1_es_otorhinolaryngology
|
| 137 |
+
notes: Created by mteb
|
| 138 |
+
value: 0.00483
|
| 139 |
+
- dataset:
|
| 140 |
+
id: clinia/CUREv1
|
| 141 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 142 |
+
task_id: CUREv1_fr_otorhinolaryngology
|
| 143 |
+
notes: Created by mteb
|
| 144 |
+
value: 0.02196
|
| 145 |
+
- dataset:
|
| 146 |
+
id: clinia/CUREv1
|
| 147 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 148 |
+
task_id: CUREv1_en_plastic_surgery
|
| 149 |
+
notes: Created by mteb
|
| 150 |
+
value: 0.34636
|
| 151 |
+
- dataset:
|
| 152 |
+
id: clinia/CUREv1
|
| 153 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 154 |
+
task_id: CUREv1_es_plastic_surgery
|
| 155 |
+
notes: Created by mteb
|
| 156 |
+
value: 0.01692
|
| 157 |
+
- dataset:
|
| 158 |
+
id: clinia/CUREv1
|
| 159 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 160 |
+
task_id: CUREv1_fr_plastic_surgery
|
| 161 |
+
notes: Created by mteb
|
| 162 |
+
value: 0.02923
|
| 163 |
+
- dataset:
|
| 164 |
+
id: clinia/CUREv1
|
| 165 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 166 |
+
task_id: CUREv1_en_psychiatry_and_psychology
|
| 167 |
+
notes: Created by mteb
|
| 168 |
+
value: 0.34984
|
| 169 |
+
- dataset:
|
| 170 |
+
id: clinia/CUREv1
|
| 171 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 172 |
+
task_id: CUREv1_es_psychiatry_and_psychology
|
| 173 |
+
notes: Created by mteb
|
| 174 |
+
value: 0.01113
|
| 175 |
+
- dataset:
|
| 176 |
+
id: clinia/CUREv1
|
| 177 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 178 |
+
task_id: CUREv1_fr_psychiatry_and_psychology
|
| 179 |
+
notes: Created by mteb
|
| 180 |
+
value: 0.02743
|
| 181 |
+
- dataset:
|
| 182 |
+
id: clinia/CUREv1
|
| 183 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 184 |
+
task_id: CUREv1_en_pulmonology
|
| 185 |
+
notes: Created by mteb
|
| 186 |
+
value: 0.34924
|
| 187 |
+
- dataset:
|
| 188 |
+
id: clinia/CUREv1
|
| 189 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 190 |
+
task_id: CUREv1_es_pulmonology
|
| 191 |
+
notes: Created by mteb
|
| 192 |
+
value: 0.01324
|
| 193 |
+
- dataset:
|
| 194 |
+
id: clinia/CUREv1
|
| 195 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 196 |
+
task_id: CUREv1_fr_pulmonology
|
| 197 |
+
notes: Created by mteb
|
| 198 |
+
value: 0.01515
|
| 199 |
+
- dataset:
|
| 200 |
+
id: clinia/CUREv1
|
| 201 |
+
revision: 3bcf51c91e04d04a8a3329dfbe988b964c5cbe83
|
| 202 |
+
task_id: CUREv1
|
| 203 |
+
notes: Created by mteb
|
| 204 |
+
value: 0.13697939393939393
|
.eval_results/ChatDoctorRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: embedding-benchmark/ChatDoctor_HealthCareMagic
|
| 3 |
+
revision: 50c2986fedffa33b38afd5c1752026f8e9e5ed1d
|
| 4 |
+
task_id: ChatDoctorRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.31764
|
| 7 |
+
- dataset:
|
| 8 |
+
id: embedding-benchmark/ChatDoctor_HealthCareMagic
|
| 9 |
+
revision: 50c2986fedffa33b38afd5c1752026f8e9e5ed1d
|
| 10 |
+
task_id: ChatDoctorRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.31764
|
.eval_results/ClimateFEVER.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/climate-fever
|
| 3 |
+
revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
|
| 4 |
+
task_id: ClimateFEVER_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.13621
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/climate-fever
|
| 9 |
+
revision: 47f2ac6acb640fc46020b02a5b59fdda04d39380
|
| 10 |
+
task_id: ClimateFEVER
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.13621
|
.eval_results/CmedqaRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/CmedqaRetrieval
|
| 3 |
+
revision: c476f85bf03d6642ec66bf54b9a551c88108bbb4
|
| 4 |
+
task_id: CmedqaRetrieval_default_dev
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.01337
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/CmedqaRetrieval
|
| 9 |
+
revision: c476f85bf03d6642ec66bf54b9a551c88108bbb4
|
| 10 |
+
task_id: CmedqaRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.01337
|
.eval_results/Code1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/Code1Retrieval
|
| 3 |
+
revision: 94d25599a7e0221484f31749448e5ea217484e41
|
| 4 |
+
task_id: Code1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.44744
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/Code1Retrieval
|
| 9 |
+
revision: 94d25599a7e0221484f31749448e5ea217484e41
|
| 10 |
+
task_id: Code1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.44744
|
.eval_results/DBPedia.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/dbpedia
|
| 3 |
+
revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
|
| 4 |
+
task_id: DBPedia_default_dev
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.34447
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/dbpedia
|
| 9 |
+
revision: c0f706b76e590d620bd6618b3ca8efdd34e2d659
|
| 10 |
+
task_id: DBPedia_default_test
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.29907
|
.eval_results/DS1000Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: embedding-benchmark/DS1000
|
| 3 |
+
revision: 25cd4dc8172e799235d83c66439b6b7b8e6583ec
|
| 4 |
+
task_id: DS1000Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.41454
|
| 7 |
+
- dataset:
|
| 8 |
+
id: embedding-benchmark/DS1000
|
| 9 |
+
revision: 25cd4dc8172e799235d83c66439b6b7b8e6583ec
|
| 10 |
+
task_id: DS1000Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.41454
|
.eval_results/EnglishFinance1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/EnglishFinance1Retrieval
|
| 3 |
+
revision: b2816ead5389ee383019bb2e50df9f1aac8229d8
|
| 4 |
+
task_id: EnglishFinance1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.75345
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/EnglishFinance1Retrieval
|
| 9 |
+
revision: b2816ead5389ee383019bb2e50df9f1aac8229d8
|
| 10 |
+
task_id: EnglishFinance1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.75345
|
.eval_results/EnglishFinance2Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/EnglishFinance2Retrieval
|
| 3 |
+
revision: 346d5039b9ec75a7b80f8ff008d5ca3df126f5aa
|
| 4 |
+
task_id: EnglishFinance2Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.76472
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/EnglishFinance2Retrieval
|
| 9 |
+
revision: 346d5039b9ec75a7b80f8ff008d5ca3df126f5aa
|
| 10 |
+
task_id: EnglishFinance2Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.76472
|
.eval_results/EnglishFinance3Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/EnglishFinance3Retrieval
|
| 3 |
+
revision: 5ed0bc0fffa309e99400ea800397931749d12cd2
|
| 4 |
+
task_id: EnglishFinance3Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.45123
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/EnglishFinance3Retrieval
|
| 9 |
+
revision: 5ed0bc0fffa309e99400ea800397931749d12cd2
|
| 10 |
+
task_id: EnglishFinance3Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.45123
|
.eval_results/EnglishFinance4Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/EnglishFinance4Retrieval
|
| 3 |
+
revision: 2fdb7001309f897d50d38d196a3fd0f03c913810
|
| 4 |
+
task_id: EnglishFinance4Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.3173
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/EnglishFinance4Retrieval
|
| 9 |
+
revision: 2fdb7001309f897d50d38d196a3fd0f03c913810
|
| 10 |
+
task_id: EnglishFinance4Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.3173
|
.eval_results/EnglishHealthcare1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/EnglishHealthcare1Retrieval
|
| 3 |
+
revision: 393c24e85114d44c43259fb2d1c5639c5d09809d
|
| 4 |
+
task_id: EnglishHealthcare1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.68748
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/EnglishHealthcare1Retrieval
|
| 9 |
+
revision: 393c24e85114d44c43259fb2d1c5639c5d09809d
|
| 10 |
+
task_id: EnglishHealthcare1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.68748
|
.eval_results/FEVER.yaml
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/fever
|
| 3 |
+
revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
|
| 4 |
+
task_id: FEVER_default_dev
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.49778
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/fever
|
| 9 |
+
revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
|
| 10 |
+
task_id: FEVER_default_test
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.4809
|
| 13 |
+
- dataset:
|
| 14 |
+
id: mteb/fever
|
| 15 |
+
revision: bea83ef9e8fb933d90a2f1d5515737465d613e12
|
| 16 |
+
task_id: FEVER_default_train
|
| 17 |
+
notes: Created by mteb
|
| 18 |
+
value: 0.38431
|
.eval_results/FiQA2018.yaml
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/fiqa
|
| 3 |
+
revision: 27a168819829fe9bcd655c2df245fb19452e8e06
|
| 4 |
+
task_id: FiQA2018_default_dev
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.2592
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/fiqa
|
| 9 |
+
revision: 27a168819829fe9bcd655c2df245fb19452e8e06
|
| 10 |
+
task_id: FiQA2018_default_test
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.25139
|
| 13 |
+
- dataset:
|
| 14 |
+
id: mteb/fiqa
|
| 15 |
+
revision: 27a168819829fe9bcd655c2df245fb19452e8e06
|
| 16 |
+
task_id: FiQA2018_default_train
|
| 17 |
+
notes: Created by mteb
|
| 18 |
+
value: 0.24794
|
.eval_results/FinQARetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: embedding-benchmark/FinQA
|
| 3 |
+
revision: bdd1903ce03153129480bfc14b710e3d612c1efd
|
| 4 |
+
task_id: FinQARetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.73872
|
| 7 |
+
- dataset:
|
| 8 |
+
id: embedding-benchmark/FinQA
|
| 9 |
+
revision: bdd1903ce03153129480bfc14b710e3d612c1efd
|
| 10 |
+
task_id: FinQARetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.73872
|
.eval_results/FinanceBenchRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: embedding-benchmark/FinanceBench
|
| 3 |
+
revision: e68478442112cae36b70a216f52cc2777acf0a7e
|
| 4 |
+
task_id: FinanceBenchRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.46676
|
| 7 |
+
- dataset:
|
| 8 |
+
id: embedding-benchmark/FinanceBench
|
| 9 |
+
revision: e68478442112cae36b70a216f52cc2777acf0a7e
|
| 10 |
+
task_id: FinanceBenchRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.46676
|
.eval_results/French1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/French1Retrieval
|
| 3 |
+
revision: c5c5a44f75dff57be44e5623e817239b050bf0f2
|
| 4 |
+
task_id: French1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.78323
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/French1Retrieval
|
| 9 |
+
revision: c5c5a44f75dff57be44e5623e817239b050bf0f2
|
| 10 |
+
task_id: French1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.78323
|
.eval_results/FrenchLegal1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/FrenchLegal1Retrieval
|
| 3 |
+
revision: 6d7308571a1572e22d5c0c1cb87385a7bb6b2c6d
|
| 4 |
+
task_id: FrenchLegal1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.94897
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/FrenchLegal1Retrieval
|
| 9 |
+
revision: 6d7308571a1572e22d5c0c1cb87385a7bb6b2c6d
|
| 10 |
+
task_id: FrenchLegal1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.94897
|
.eval_results/FreshStackRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: embedding-benchmark/FreshStack_mteb
|
| 3 |
+
revision: 7a20df1abe4dafc46f93f9a7965bf9c6968bdf04
|
| 4 |
+
task_id: FreshStackRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.27888
|
| 7 |
+
- dataset:
|
| 8 |
+
id: embedding-benchmark/FreshStack_mteb
|
| 9 |
+
revision: 7a20df1abe4dafc46f93f9a7965bf9c6968bdf04
|
| 10 |
+
task_id: FreshStackRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.27888
|
.eval_results/German1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/German1Retrieval
|
| 3 |
+
revision: d83dd140fc8fdf96372a6e9193cd4fd2d5cb72bd
|
| 4 |
+
task_id: German1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.86465
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/German1Retrieval
|
| 9 |
+
revision: d83dd140fc8fdf96372a6e9193cd4fd2d5cb72bd
|
| 10 |
+
task_id: German1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.86465
|
.eval_results/GermanHealthcare1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/GermanHealthcare1Retrieval
|
| 3 |
+
revision: 53e9a6fb88b48b7513e9d2cc2218e3415f4e45f8
|
| 4 |
+
task_id: GermanHealthcare1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.37248
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/GermanHealthcare1Retrieval
|
| 9 |
+
revision: 53e9a6fb88b48b7513e9d2cc2218e3415f4e45f8
|
| 10 |
+
task_id: GermanHealthcare1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.37248
|
.eval_results/GermanLegal1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/GermanLegal1Retrieval
|
| 3 |
+
revision: 65ea369daff680b77f90b560e7e97d2ab4ec5072
|
| 4 |
+
task_id: GermanLegal1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.66876
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/GermanLegal1Retrieval
|
| 9 |
+
revision: 65ea369daff680b77f90b560e7e97d2ab4ec5072
|
| 10 |
+
task_id: GermanLegal1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.66876
|
.eval_results/HC3FinanceRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: embedding-benchmark/HC3Finance
|
| 3 |
+
revision: fda6fad068f2ed814d99f29dc95dbb28ac586943
|
| 4 |
+
task_id: HC3FinanceRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.28977
|
| 7 |
+
- dataset:
|
| 8 |
+
id: embedding-benchmark/HC3Finance
|
| 9 |
+
revision: fda6fad068f2ed814d99f29dc95dbb28ac586943
|
| 10 |
+
task_id: HC3FinanceRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.28977
|
.eval_results/HotpotQA.yaml
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/hotpotqa
|
| 3 |
+
revision: ab518f4d6fcca38d87c25209f94beba119d02014
|
| 4 |
+
task_id: HotpotQA_default_dev
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.59451
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/hotpotqa
|
| 9 |
+
revision: ab518f4d6fcca38d87c25209f94beba119d02014
|
| 10 |
+
task_id: HotpotQA_default_test
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.56907
|
| 13 |
+
- dataset:
|
| 14 |
+
id: mteb/hotpotqa
|
| 15 |
+
revision: ab518f4d6fcca38d87c25209f94beba119d02014
|
| 16 |
+
task_id: HotpotQA_default_train
|
| 17 |
+
notes: Created by mteb
|
| 18 |
+
value: 0.58909
|
.eval_results/HumanEvalRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: embedding-benchmark/HumanEval
|
| 3 |
+
revision: ed1f48aca747f10bac146795328e2f03326e7625
|
| 4 |
+
task_id: HumanEvalRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.38472
|
| 7 |
+
- dataset:
|
| 8 |
+
id: embedding-benchmark/HumanEval
|
| 9 |
+
revision: ed1f48aca747f10bac146795328e2f03326e7625
|
| 10 |
+
task_id: HumanEvalRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.38472
|
.eval_results/JaCWIRRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/JaCWIRRetrieval
|
| 3 |
+
revision: abf6d5fb6759ad516f998bd887b75420d595672e
|
| 4 |
+
task_id: JaCWIRRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.19066
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/JaCWIRRetrieval
|
| 9 |
+
revision: abf6d5fb6759ad516f998bd887b75420d595672e
|
| 10 |
+
task_id: JaCWIRRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.19066
|
.eval_results/JaGovFaqsRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/JaGovFaqsRetrieval
|
| 3 |
+
revision: 0726b2af53c907628067871e2e7c84e0d8e099c2
|
| 4 |
+
task_id: JaGovFaqsRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.12557
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/JaGovFaqsRetrieval
|
| 9 |
+
revision: 0726b2af53c907628067871e2e7c84e0d8e099c2
|
| 10 |
+
task_id: JaGovFaqsRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.12557
|
.eval_results/JapaneseCode1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/JapaneseCode1Retrieval
|
| 3 |
+
revision: fc4cb6390055e65490dfc42526e1d6a379e8cd86
|
| 4 |
+
task_id: JapaneseCode1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.33855
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/JapaneseCode1Retrieval
|
| 9 |
+
revision: fc4cb6390055e65490dfc42526e1d6a379e8cd86
|
| 10 |
+
task_id: JapaneseCode1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.33855
|
.eval_results/JapaneseLegal1Retrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb-private/JapaneseLegal1Retrieval
|
| 3 |
+
revision: d653557fe66bb6af2b0e2adfc371a24554cf11ce
|
| 4 |
+
task_id: JapaneseLegal1Retrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.11133
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb-private/JapaneseLegal1Retrieval
|
| 9 |
+
revision: d653557fe66bb6af2b0e2adfc371a24554cf11ce
|
| 10 |
+
task_id: JapaneseLegal1Retrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.11133
|
.eval_results/JaqketRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/jaqket
|
| 3 |
+
revision: 3a5b92dad489a61e664c05ed2175bc9220230199
|
| 4 |
+
task_id: JaqketRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.13284
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/jaqket
|
| 9 |
+
revision: 3a5b92dad489a61e664c05ed2175bc9220230199
|
| 10 |
+
task_id: JaqketRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.13284
|
.eval_results/LegalQuAD.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/LegalQuAD
|
| 3 |
+
revision: 37aa6cfb01d48960b0f8e3f17d6e3d99bf1ebc3e
|
| 4 |
+
task_id: LegalQuAD_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.76755
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/LegalQuAD
|
| 9 |
+
revision: 37aa6cfb01d48960b0f8e3f17d6e3d99bf1ebc3e
|
| 10 |
+
task_id: LegalQuAD
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.76755
|
.eval_results/LegalSummarization.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: mteb/legal_summarization
|
| 3 |
+
revision: 3bb1a05c66872889662af04c5691c14489cebd72
|
| 4 |
+
task_id: LegalSummarization_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.60983
|
| 7 |
+
- dataset:
|
| 8 |
+
id: mteb/legal_summarization
|
| 9 |
+
revision: 3bb1a05c66872889662af04c5691c14489cebd72
|
| 10 |
+
task_id: LegalSummarization
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.60983
|
.eval_results/MBPPRetrieval.yaml
ADDED
|
@@ -0,0 +1,12 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
- dataset:
|
| 2 |
+
id: embedding-benchmark/MBPP
|
| 3 |
+
revision: 586a1fd6a0c63fdeda3b49c0293559a81c79cdec
|
| 4 |
+
task_id: MBPPRetrieval_default_test
|
| 5 |
+
notes: Created by mteb
|
| 6 |
+
value: 0.11637
|
| 7 |
+
- dataset:
|
| 8 |
+
id: embedding-benchmark/MBPP
|
| 9 |
+
revision: 586a1fd6a0c63fdeda3b49c0293559a81c79cdec
|
| 10 |
+
task_id: MBPPRetrieval
|
| 11 |
+
notes: Created by mteb
|
| 12 |
+
value: 0.11637
|