BidirLM-1B-Embedding / mteb_v2_eval_prompts.json
TheoDB's picture
Update mteb_v2_eval_prompts.json: add 10 tasks
380da06 verified
{
"BornholmBitextMining": "Retrieve parallel sentences between Danish and Bornholmsk dialect",
"CEDRClassification": "Classify the emotion expressed in the given text into one of five categories: joy, sadness, surprise, fear, or anger",
"DalajClassification": "Classify the linguistic acceptability of the given Swedish sentence",
"NorwegianCourtsBitextMining": "Retrieve parallel sentences between Norwegian Bokmål and Nynorsk",
"ScalaClassification": "Classify the linguistic acceptability of the given Scandinavian sentence",
"SpartQA": "Given a spatial reasoning question, retrieve the passage that answers the question",
"SwednClusteringP2P": "Identify the topic or theme of the given Swedish news articles",
"TempReasonL1": "Given a temporal reasoning question, retrieve the passage that answers the question",
"TwitterHjerneRetrieval": "Given a Danish question, retrieve the corresponding answer",
"WinoGrande": "Given a commonsense reasoning question, retrieve the passage that answers the question",
"AmazonCounterfactualClassification": "Given an Amazon review, judge whether it is counterfactual.",
"AmazonPolarityClassification": "Classifying Amazon reviews into positive or negative sentiment",
"AmazonReviewsClassification": "Classifying the given Amazon review into its appropriate rating category",
"Banking77Classification": "Given an online banking query, find the corresponding intents",
"EmotionClassification": "Classify the emotion expressed in the given Twitter message into one of the six emotions: anger, fear, joy, love, sadness, and surprise",
"ImdbClassification": "Classifying the sentiment expressed in the given movie review text from the IMDB dataset",
"MassiveIntentClassification": "Given a user utterance as query, find the user intents",
"MassiveScenarioClassification": "Given a user utterance as query, find the user scenarios",
"MTOPDomainClassification": "Classifying the intent domain of the given utterance in task-oriented conversation",
"MTOPIntentClassification": "Classifying the intent of the given utterance in task-oriented conversation",
"ToxicConversationsClassification": "Classifying the given comments as either toxic or not toxic",
"TweetSentimentExtractionClassification": "Classifying the sentiment of a given tweet as either positive, negative, or neutral",
"TNews": "Categorizing the given news title",
"IFlyTek": "Given an App description text, find the appropriate fine-grained category",
"MultilingualSentiment": "Classifying sentiment of the customer review into positive, neutral, or negative",
"JDReview": "Classifying sentiment of the customer review for iPhoneinto positive or negative",
"OnlineShopping": "Classifying sentiment of the customer reviewinto positive or negative",
"Waimai": "Classify the customer review from a food takeaway platform into positive or negative",
"ArxivClusteringP2P": "Identify the main and secondary category of Arxiv papers based on the titles and abstracts",
"ArxivClusteringS2S": "Identify the main and secondary category of Arxiv papers based on the titles",
"BiorxivClusteringP2P": "Identify the main category of Biorxiv papers based on the titles and abstracts",
"BiorxivClusteringS2S": "Identify the main category of Biorxiv papers based on the titles",
"MedrxivClusteringP2P": "Identify the main category of Medrxiv papers based on the titles and abstracts",
"MedrxivClusteringS2S": "Identify the main category of Medrxiv papers based on the titles",
"RedditClustering": "Identify the topic or theme of Reddit posts based on the titles",
"RedditClusteringP2P": "Identify the topic or theme of Reddit posts based on the titles and posts",
"StackExchangeClustering": "Identify the topic or theme of StackExchange posts based on the titles",
"StackExchangeClusteringP2P": "Identify the topic or theme of StackExchange posts based on the given paragraphs",
"TwentyNewsgroupsClustering": "Identify the topic or theme of the given news articles",
"CLSClusteringS2S": "Identify the main category of scholar papers based on the titles",
"CLSClusteringP2P": "Identify the main category of scholar papers based on the titles and abstracts",
"ThuNewsClusteringS2S": "Identify the topic or theme of the given news articles based on the titles",
"ThuNewsClusteringP2P": "Identify the topic or theme of the given news articles based on the titles and contents",
"AskUbuntuDupQuestions": "Given a question, retrieve detailed question descriptions from Stackexchange that are duplicates to the given question",
"MindSmallReranking": "Given a query, retrieve documents that answer the query.",
"SciDocsRR": "Given a query, retrieve documents that answer the query.",
"StackOverflowDupQuestions": "Given a question, retrieve detailed question descriptions from Stackexchange that are duplicates to the given question",
"SprintDuplicateQuestions": "Given a question, retrieve detailed question descriptions from Stackexchange that are duplicates to the given question",
"TwitterSemEval2015": "Retrieve semantically similar text.",
"TwitterURLCorpus": "Retrieve semantically similar text.",
"T2Reranking": "Given a query, retrieve documents that answer the query.",
"MmarcoReranking": "Given a query, retrieve documents that answer the query.",
"CMedQAv1": "Given a query, retrieve documents that answer the query.",
"CMedQAv2": "Given a query, retrieve documents that answer the query.",
"Ocnli": "Retrieve semantically similar text.",
"Cmnli": "Retrieve semantically similar text.",
"ArguAna": {
"query": "Given a claim, retrieve documents that support or refute the claim",
"passage": "Given a claim, retrieve documents that support or refute the claim"
},
"ClimateFEVER": "Given a claim, retrieve documents that support or refute the claim",
"ClimateFEVERHardNegatives": "Given a claim, retrieve documents that support or refute the claim",
"DBPedia": "Given a query, retrieve documents that answer the query.",
"FEVER": "Given a claim, retrieve documents that support or refute the claim",
"FEVERHardNegatives": "Given a claim, retrieve documents that support or refute the claim",
"FiQA2018": "Given a query, retrieve documents that answer the query.",
"HotpotQA": "Given a multi-hop question, retrieve documents that can help answer the question",
"HotpotQAHardNegatives": "Given a multi-hop question, retrieve documents that can help answer the question",
"MSMARCO": "Given a web search query, retrieve relevant passages that answer the query",
"NFCorpus": "Given a question, retrieve relevant documents that best answer the question",
"NQ": "Given a question, retrieve Wikipedia passages that answer the question",
"QuoraRetrieval": "Given a query, retrieve documents that answer the query.",
"SCIDOCS": "Given a query, retrieve documents that answer the query.",
"SciFact": "Given a scientific claim, retrieve documents that support or refute the claim",
"Touche2020": "Given a query, retrieve documents that answer the query.",
"Touche2020Retrieval.v3": "Given a query, retrieve documents that answer the query.",
"TRECCOVID": "Given a query, retrieve documents that answer the query.",
"T2Retrieval": "Given a question, retrieve passages that answer the question",
"MMarcoRetrieval": "Given a web search query, retrieve relevant passages that answer the query",
"DuRetrieval": "Given a question, retrieve passages that answer the question",
"CovidRetrieval": "Given a query on COVID-19, retrieve documents that answer the query",
"CmedqaRetrieval": "Given a query, retrieve documents that answer the query.",
"EcomRetrieval": "Given a query, retrieve documents that answer the query.",
"MedicalRetrieval": "Given a query, retrieve documents that answer the query.",
"VideoRetrieval": "Given a query, retrieve documents that answer the query.",
"STSBenchmarkMultilingualSTS": "Retrieve semantically similar text",
"SICKFr": "Retrieve semantically similar text",
"SummEvalFr": "Retrieve semantically similar text.",
"MasakhaNEWSClassification": "Categorizing the given news title",
"OpusparcusPC": "Retrieve semantically similar text",
"PawsX": "Retrieve semantically similar text",
"AlloProfClusteringP2P": "Identify the main category of scholar papers based on the titles and abstracts",
"AlloProfClusteringS2S": "Identify the main category of scholar papers based on the titles",
"HALClusteringS2S": "Identify the main category of scholar papers based on the titles",
"MasakhaNEWSClusteringP2P": "Identify the topic or theme of the given news articles based on the titles and contents",
"MasakhaNEWSClusteringS2S": "Identify the topic or theme of the given news articles based on the titles",
"MLSUMClusteringP2P": "Identify the topic or theme of Reddit posts based on the titles and posts",
"MLSUMClusteringS2S": "Identify the topic or theme of Reddit posts based on the titles",
"SyntecReranking": "Given a question, retrieve passages that answer the question",
"AlloprofReranking": "Given a question, retrieve passages that answer the question",
"AlloprofRetrieval": "Given a question, retrieve passages that answer the question",
"BSARDRetrieval": "Given a question, retrieve passages that answer the question",
"SyntecRetrieval": "Given a question, retrieve passages that answer the question",
"XPQARetrieval": "Given a question, retrieve passages that answer the question",
"MintakaRetrieval": "Given a question, retrieve passages that answer the question",
"CBD": "Classifying the sentiment of a given tweet as either positive, negative, or neutral",
"PolEmo2.0-IN": "Classifying sentiment of the customer review into positive, neutral, or negative",
"PolEmo2.0-OUT": "Classifying sentiment of the customer review into positive, neutral, or negative",
"AllegroReviews": "Classifying sentiment of the customer review into positive, neutral, or negative",
"PAC": "Classify the sentence into one of the two types: 'BEZPIECZNE_POSTANOWIENIE_UMOWNE' and 'KLAUZULA_ABUZYWNA'",
"SICK-E-PL": "Retrieve semantically similar text",
"SICK-R-PL": "Retrieve semantically similar text",
"STS22": "Retrieve semantically similar text",
"AFQMC": "Retrieve semantically similar text",
"BQ": "Retrieve semantically similar text",
"LCQMC": "Retrieve semantically similar text",
"PAWSX": "Retrieve semantically similar text",
"QBQTC": "Retrieve semantically similar text",
"STS12": "Retrieve semantically similar text",
"PPC": "Retrieve semantically similar text",
"CDSC-E": "Retrieve semantically similar text",
"PSC": "Retrieve semantically similar text",
"8TagsClustering": "Identify the topic or theme of the given news articles",
"ArguAna-PL": "Given a claim, retrieve documents that support or refute the claim",
"DBPedia-PL": "Given a query, retrieve documents that answer the query.",
"FiQA-PL": "Given a query, retrieve documents that answer the query.",
"HotpotQA-PL": "Given a multi-hop question, retrieve documents that can help answer the question",
"MSMARCO-PL": "Given a web search query, retrieve relevant passages that answer the query",
"NFCorpus-PL": "Given a question, retrieve relevant documents that best answer the question",
"NQ-PL": "Given a question, retrieve Wikipedia passages that answer the question",
"Quora-PL": "Given a query, retrieve documents that answer the query.",
"SCIDOCS-PL": "Given a query, retrieve documents that answer the query.",
"SciFact-PL": "Given a scientific claim, retrieve documents that support or refute the claim",
"TRECCOVID-PL": "Given a query, retrieve documents that answer the query.",
"GeoreviewClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"HeadlineClassification": "Categorizing the given news title",
"InappropriatenessClassification": "Classifying the given comments as either toxic or not toxic",
"KinopoiskClassification": "Classifying the sentiment expressed in the given movie review text from the IMDB dataset",
"RuReviewsClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"RuSciBenchGRNTIClassification": "Categorizing the given news title",
"RuSciBenchOECDClassification": "Categorizing the given news title",
"GeoreviewClusteringP2P": "Identify the topic or theme of Reddit posts based on the titles and posts",
"RuSciBenchGRNTIClusteringP2P": "Identify the main category of scholar papers based on the titles and abstracts",
"RuSciBenchOECDClusteringP2P": "Identify the main category of scholar papers based on the titles and abstracts",
"TERRa": "Retrieve semantically similar text.",
"RuBQReranking": "Given a question, retrieve Wikipedia passages that answer the question",
"RiaNewsRetrieval": "Given a query, retrieve documents that answer the query.",
"RuBQRetrieval": "Given a question, retrieve Wikipedia passages that answer the question",
"RUParaPhraserSTS": "Retrieve semantically similar text",
"RuSTSBenchmarkSTS": "Retrieve semantically similar text",
"AppsRetrieval": "Given a query, retrieve documents that answer the query.",
"COIRCodeSearchNetRetrieval": "Given a query, retrieve documents that answer the query.",
"CodeEditSearchRetrieval": "Given a query, retrieve documents that answer the query.",
"CodeFeedbackMT": "Given a query, retrieve documents that answer the query.",
"CodeFeedbackST": "Given a query, retrieve documents that answer the query.",
"CodeSearchNetCCRetrieval": "Given a query, retrieve documents that answer the query.",
"CodeSearchNetRetrieval": "Given a query, retrieve documents that answer the query.",
"CodeTransOceanContest": "Given a query, retrieve documents that answer the query.",
"CodeTransOceanDL": "Given a query, retrieve documents that answer the query.",
"CosQA": "Given a query, retrieve documents that answer the query.",
"StackOverflowQA": "Given a query, retrieve documents that answer the query.",
"SyntheticText2SQL": "Given a query, retrieve documents that answer the query.",
"BibleNLPBitextMining": "Retrieve semantically similar text.",
"BUCC.v2": "Retrieve semantically similar text.",
"DiaBlaBitextMining": "Retrieve semantically similar text.",
"FloresBitextMining": "Retrieve semantically similar text.",
"IN22GenBitextMining": "Retrieve semantically similar text.",
"IndicGenBenchFloresBitextMining": "Retrieve semantically similar text.",
"NollySentiBitextMining": "Retrieve semantically similar text.",
"NTREXBitextMining": "Retrieve semantically similar text.",
"NusaTranslationBitextMining": "Retrieve semantically similar text.",
"NusaXBitextMining": "Retrieve semantically similar text.",
"Tatoeba": "Retrieve semantically similar text.",
"BulgarianStoreReviewSentimentClassfication": "Classifying sentiment of the customer review into positive, neutral, or negative",
"CzechProductReviewSentimentClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"GreekLegalCodeClassification": "Categorizing the given news title",
"DBpediaClassification": "Given an App description text, find the appropriate fine-grained category",
"FinancialPhrasebankClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"PoemSentimentClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"TweetTopicSingleClassification": "Categorizing the given news title",
"EstonianValenceClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"FilipinoShopeeReviewsClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"GujaratiNewsClassification": "Categorizing the given news title",
"SentimentAnalysisHindi": "Classifying sentiment of the customer review into positive, neutral, or negative",
"IndonesianIdClickbaitClassification": "Categorizing the given news title",
"ItaCaseholdClassification": "Categorizing the given news title",
"KorSarcasmClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"KurdishSentimentClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"MacedonianTweetSentimentClassification": "Classifying the sentiment of a given tweet as either positive, negative, or neutral",
"AfriSentiClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"CataloniaTweetClassification": "Classifying the sentiment of a given tweet as either positive, negative, or neutral",
"CyrillicTurkicLangClassification": "Given a text, classify its language",
"IndicLangClassification": "Given a text, classify its language",
"MultiHateClassification": "Classifying the given comments as either toxic or not toxic",
"NusaParagraphEmotionClassification": "Classify the emotion expressed in the given Twitter message into one of the six emotions: anger, fear, joy, love, sadness, and surprise",
"NusaX-senti": "Classifying sentiment of the customer review into positive, neutral, or negative",
"SwissJudgementClassification": "Classifying sentiment of the customer review into positive, neutral, or negative",
"NepaliNewsClassification": "Categorizing the given news title",
"OdiaNewsClassification": "Categorizing the given news title",
"PunjabiNewsClassification": "Categorizing the given news title",
"SinhalaNewsClassification": "Categorizing the given news title",
"CSFDSKMovieReviewSentimentClassification": "Classifying the sentiment expressed in the given movie review text from the IMDB dataset",
"SiswatiNewsClassification": "Categorizing the given news title",
"SlovakMovieReviewSentimentClassification": "Classifying the sentiment expressed in the given movie review text from the IMDB dataset",
"SwahiliNewsClassification": "Categorizing the given news title",
"TswanaNewsClassification": "Categorizing the given news title",
"IsiZuluNewsClassification": "Categorizing the given news title",
"WikiCitiesClustering": "Identify the topic or theme of the given news articles",
"RomaniBibleClustering": "Identify the topic or theme of the given news articles",
"ArXivHierarchicalClusteringP2P": "Identify the main and secondary category of Arxiv papers based on the titles and abstracts",
"ArXivHierarchicalClusteringS2S": "Identify the main and secondary category of Arxiv papers based on the titles",
"BigPatentClustering.v2": "Identify the main category of scholar papers based on the titles and abstracts",
"AlloProfClusteringS2S.v2": "Identify the main category of scholar papers based on the titles",
"HALClusteringS2S.v2": "Identify the main category of scholar papers based on the titles",
"SIB200ClusteringS2S": "Identify the topic or theme of the given news articles",
"WikiClusteringP2P.v2": "Identify the topic or theme of the given news articles",
"PlscClusteringP2P.v2": "Identify the main category of scholar papers based on the titles and abstracts",
"KorHateSpeechMLClassification": "Classifying the given comments as either toxic or not toxic",
"MalteseNewsClassification": "Categorizing the given news title",
"MultiEURLEXMultilabelClassification": "Categorizing the given news title",
"BrazilianToxicTweetsClassification": "Classifying the given comments as either toxic or not toxic",
"CTKFactsNLI": "Retrieve semantically similar text",
"indonli": "Retrieve semantically similar text",
"ArmenianParaphrasePC": "Retrieve semantically similar text",
"PawsXPairClassification": "Retrieve semantically similar text",
"RTE3": "Retrieve semantically similar text",
"XNLI": "Retrieve semantically similar text",
"PpcPC": "Retrieve semantically similar text",
"GermanSTSBenchmark": "Retrieve semantically similar text",
"SICK-R": "Retrieve semantically similar text",
"STS13": "Retrieve semantically similar text",
"STS14": "Retrieve semantically similar text",
"STSBenchmark": "Retrieve semantically similar text",
"FaroeseSTS": "Retrieve semantically similar text",
"FinParaSTS": "Retrieve semantically similar text",
"JSICK": "Retrieve semantically similar text",
"IndicCrosslingualSTS": "Retrieve semantically similar text",
"SemRel24STS": "Retrieve semantically similar text",
"STS17": "Retrieve semantically similar text",
"STS22.v2": "Retrieve semantically similar text",
"STSES": "Retrieve semantically similar text",
"STSB": "Retrieve semantically similar text",
"AILAStatutes": "Given a query, retrieve documents that answer the query.",
"HagridRetrieval": "Given a query, retrieve documents that answer the query.",
"LegalBenchCorporateLobbying": "Given a query, retrieve documents that answer the query.",
"LEMBPasskeyRetrieval": "Given a query, retrieve documents that answer the query.",
"BelebeleRetrieval": "Given a query, retrieve documents that answer the query.",
"MLQARetrieval": "Given a query, retrieve documents that answer the query.",
"StatcanDialogueDatasetRetrieval": "Given a query, retrieve documents that answer the query.",
"WikipediaRetrievalMultilingual": "Given a query, retrieve documents that answer the query.",
"Core17InstructionRetrieval": "Given a query, retrieve documents that answer the query.",
"News21InstructionRetrieval": "Given a query, retrieve documents that answer the query.",
"Robust04InstructionRetrieval": "Given a query, retrieve documents that answer the query.",
"WebLINXCandidatesReranking": "Given a query, retrieve documents that answer the query.",
"WikipediaRerankingMultilingual": "Given a query, retrieve documents that answer the query.",
"STS15": "Retrieve semantically similar text",
"MIRACLRetrievalHardNegatives": "Given a question, retrieve passages that answer the question",
"BIOSSES": "Retrieve semantically similar text",
"CQADupstackRetrieval": "Given a question, retrieve detailed question descriptions from Stackexchange that are duplicates to the given question",
"CQADupstackGamingRetrieval": {
"query": "Given a question, retrieve detailed question descriptions from Stackexchange that are duplicates to the given question",
"passage": "Given a question, retrieve detailed question descriptions from Stackexchange that are duplicates to the given question"
},
"CQADupstackUnixRetrieval": {
"query": "Given a question, retrieve detailed question descriptions from Stackexchange that are duplicates to the given question",
"passage": "Given a question, retrieve detailed question descriptions from Stackexchange that are duplicates to the given question"
},
"STS16": "Retrieve semantically similar text",
"SummEval": "Retrieve semantically similar text",
"ATEC": "Retrieve semantically similar text"
}