Geralt-Targaryen commited on
Commit
35baae5
·
verified ·
1 Parent(s): 0311ad7

Update config_sentence_transformers.json

Browse files
Files changed (1) hide show
  1. config_sentence_transformers.json +7 -240
config_sentence_transformers.json CHANGED
@@ -1,241 +1,8 @@
1
  {
2
- "prompts": {
3
- "STS": "Retrieve semantically similar text.",
4
- "BitextMining": "Retrieve translations of the following text.",
5
- "Classification": "Classify the topic of the given text.",
6
- "MultilabelClassification": "Classify the topic of the given text.",
7
- "Clustering": "Classify the topic of the given text.",
8
- "PairClassification": "Retrieve semantically entailed text.",
9
- "query": "Given a question, retrieve passages that can help answer the question.",
10
- "document": "",
11
- "BulgarianStoreReviewSentimentClassfication": "Classify the sentiment of the given text.",
12
- "CzechProductReviewSentimentClassification": "Classify the sentiment of the given text.",
13
- "FinancialPhrasebankClassification": "Classify the sentiment of the given text.",
14
- "PoemSentimentClassification": "Classify the sentiment of the given text.",
15
- "EstonianValenceClassification": "Classify the sentiment of the given text.",
16
- "FilipinoShopeeReviewsClassification": "Classify the sentiment of the given text.",
17
- "SentimentAnalysisHindi": "Classify the sentiment of the given text.",
18
- "KurdishSentimentClassification": "Classify the sentiment of the given text.",
19
- "MacedonianTweetSentimentClassification": "Classify the sentiment of the given text.",
20
- "AfriSentiClassification": "Classify the sentiment of the given text.",
21
- "CataloniaTweetClassification": "Classify the sentiment of the given text.",
22
- "MultiHateClassification": "Classify the sentiment of the given text.",
23
- "NusaParagraphEmotionClassification": "Classify the sentiment of the given text.",
24
- "NusaX-senti": "Classify the sentiment of the given text.",
25
- "SwissJudgementClassification": "Classify the sentiment of the given text.",
26
- "PolEmo2.0-OUT": "Classify the sentiment of the given text.",
27
- "CSFDSKMovieReviewSentimentClassification": "Classify the sentiment of the given text.",
28
- "SlovakMovieReviewSentimentClassification": "Classify the sentiment of the given text.",
29
- "CyrillicTurkicLangClassification": "Classify the text into its language.",
30
- "IndicLangClassification": "Classify the text into its language.",
31
- "NordicLangClassification": "Classify the text into its language.",
32
- "ScalaClassification": "Classify the given sentence as linguistically acceptable or not acceptable.",
33
- "DalajClassification": "Classify the given sentence as linguistically acceptable or not acceptable.",
34
- "ToxicConversationsClassification": "Classify the given comments as either toxic or not toxic.",
35
- "IndonesianIdClickbaitClassification": "Classify the given text as either clickbait or not clickbait.",
36
- "KorSarcasmClassification": "Classify the given text as either sarcasm or not sarcasm.",
37
- "AmazonCounterfactualClassification": "Classify a given Amazon customer review text as either counterfactual or not counterfactual.",
38
- "MassiveIntentClassification": "Given a user utterance as query, find the user intents.",
39
- "PAC": "Classify the given clause as either abusive or not abusive.",
40
- "Banking77Classification": "Given an online banking query, find the corresponding intents.",
41
- "ImdbClassification": "Classify the sentiment expressed in the given movie review text from the IMDB dataset.",
42
- "MTOPDomainClassification": "Classify the intent domain of the given utterance in task-oriented conversation.",
43
- "MassiveScenarioClassification": "Given a user utterance as query, find the user scenarios.",
44
- "TweetSentimentExtractionClassification": "Classify the sentiment of a given tweet as either positive, negative, or neutral",
45
- "WikiCitiesClustering": "Classify the following city description by country.",
46
- "ArXivHierarchicalClusteringP2P": "Identify the main and secondary category of arXiv papers based on the titles and abstracts.",
47
- "ArXivHierarchicalClusteringS2S": "Identify the main and secondary category of arXiv papers based on the titles.",
48
- "BiorxivClusteringP2P.v2": "Identify the main category of bioRxiv papers based on the titles and abstracts.",
49
- "MedrxivClusteringP2P.v2": "Identify the main category of medRxiv papers based on the titles and abstracts.",
50
- "StackExchangeClustering.v2": "Identify the topic or theme of StackExchange posts based on the titles.",
51
- "StackExchangeClusteringP2P.v2": "Identify the topic or theme of StackExchange posts based on the given paragraphs.",
52
- "MedrxivClusteringS2S.v2": "Identify the main category of medRxiv papers based on the titles.",
53
- "TwentyNewsgroupsClustering.v2": "Identify the topic or theme of the given news articles.",
54
- "SprintDuplicateQuestions": "Retrieve duplicate questions from Sprint forum.",
55
- "TwitterURLCorpus": "Retrieve tweets that are semantically similar to the given tweet.",
56
- "ArmenianParaphrasePC": "Retrieve paraphrases of the given sentence.",
57
- "OpusparcusPC": "Retrieve paraphrases of the given sentence.",
58
- "PawsXPairClassification": "Retrieve paraphrases of the given sentence.",
59
- "PpcPC": "Retrieve paraphrases of the given sentence.",
60
- "TwitterSemEval2015": "Retrieve tweets that are semantically similar to the given tweet.",
61
- "KorHateSpeechMLClassification": "Classify the sentiment of the given text.",
62
- "CEDRClassification": "Classify the emotion expressed in the given comment into: joy, sadness, surprise, fear, and anger.",
63
- "SummEvalSummarization.v2": "Given a news summary, retrieve other semantically similar summaries.",
64
- "AppsRetrieval": "Retrieve the most relevant code snippet for the given query.",
65
- "CodeEditSearchRetrieval": "Retrieve the most relevant code edit.",
66
- "CodeFeedbackMT": "Retrieve the most relevant response for the given query.",
67
- "CodeFeedbackST": "Retrieve the most relevant response for the given query.",
68
- "CodeSearchNetCCRetrieval": "Retrieve the most relevant code snippet for the given code snippet.",
69
- "CodeSearchNetRetrieval": "Retrieve the most relevant code snippet for the given query.",
70
- "CodeTransOceanContest": "Retrieve similar code to the given source code.",
71
- "CodeTransOceanDL": "Retrieve similar code to the given source code.",
72
- "CosQA": "Retrieve the most relevant code snippet for the given query.",
73
- "COIRCodeSearchNetRetrieval": "Retrieve the most relevant code summary for the given code snippet.",
74
- "StackOverflowQA": "Retrieve the most relevant response for the given query.",
75
- "SyntheticText2SQL": "Retrieve the most relevant sql code snippet for the given query.",
76
- "AILAStatutes": "Identify the most relevant statutes for the given situation.",
77
- "ArguAna": "Given a claim, find documents that refute the claim.",
78
- "LegalBenchCorporateLobbying": "Given a bill title, retrieve the corresponding bill summary.",
79
- "SCIDOCS": "Given a scientific paper title, retrieve paper abstracts that are cited by the given paper.",
80
- "TRECCOVID": "Given a query on COVID-19, retrieve documents that answer the query.",
81
- "CovidRetrieval": "Given a query on COVID-19, retrieve documents that answer the query.",
82
- "CQADupstackGamingRetrieval": "Given a question, retrieve questions that are semantically equivalent.",
83
- "CQADupstackUnixRetrieval": "Given a question, retrieve questions that are semantically equivalent.",
84
- "ClimateFEVERHardNegatives": "Given a claim about climate change, retrieve documents that support or refute the claim.",
85
- "FEVERHardNegatives": "Given a claim, retrieve documents that support or refute the claim.",
86
- "FiQA2018": "Given a financial question, retrieve passages that answer the question.",
87
- "HotpotQAHardNegatives": "Given a multi-hop question, retrieve passages that answer the question.",
88
- "Touche2020Retrieval.v3": "Given a question, retrieve passages that answer the question.",
89
- "WebLINXCandidatesReranking": "Given a web navigation step, retrieve relevant elements.",
90
- "AskUbuntuDupQuestions": "Retrieve duplicate questions from AskUbuntu forum.",
91
- "MindSmallReranking": "Retrieve relevant news articles based on user browsing history.",
92
- "NFCorpus": "Given a question, retrieve passages that answer the question.",
93
- "TRECCOVID-PL": "Given a query on COVID-19, retrieve documents that answer the query.",
94
- "SciFact": "Given a scientific claim, retrieve passages that support or refute the claim.",
95
- "SciFact-PL": "Given a scientific claim, retrieve passages that support or refute the claim.",
96
- "CmedqaRetrieval": "Given a question, retrieve passages that answer the question.",
97
- "CMedQAv2-reranking": "Given a question, retrieve passages that answer the question.",
98
- "AngryTweetsClassification": "Classify the sentiment of the given text.",
99
- "DanishPoliticalCommentsClassification": "Classify the sentiment of the given text.",
100
- "DKHateClassification": "Classify the given comments as either offensive or not offensive.",
101
- "LccSentimentClassification": "Classify the sentiment of the given text.",
102
- "NoRecClassification": "Classify the sentiment of the given text.",
103
- "NorwegianParliamentClassification": "Classify the sentiment of the given text.",
104
- "SwedishSentimentClassification": "Classify the sentiment of the given text.",
105
- "SweRecClassification": "Classify the sentiment of the given text.",
106
- "DanFeverRetrieval": "Given a claim, retrieve documents that support or refute the claim.",
107
- "SNLRetrieval": "Given a summary, retrieve the original article.",
108
- "SwednRetrieval": "Given a summary, retrieve the original article.",
109
- "TV2Nordretrieval": "Given a news summary, retrieve the original article.",
110
- "BengaliSentimentAnalysis": "Classify the sentiment of the given text.",
111
- "HindiDiscourseClassification": "Classify the given text into one of the five discourse modes: argumentative, narrative, descriptive, dialogic, and informative.",
112
- "MTOPIntentClassification": "Classify the intent of the given utterance in task-oriented conversation.",
113
- "TweetSentimentClassification": "Classify the sentiment of the given text.",
114
- "UrduRomanSentimentClassification": "Classify the sentiment of the given text as either positive, negative, or neutral.",
115
- "AmazonReviewsClassification": "Classify the given Amazon review into its appropriate rating category.",
116
- "BlurbsClusteringP2P": "Classify the given book title and blurb into its genre.",
117
- "BlurbsClusteringS2S": "Classify the given book title into its genre.",
118
- "FalseFriendsGermanEnglish": "Retrieve translations of the following text.",
119
- "XMarket": "Given a product name search, retrieve the corresponding product description.",
120
- "GerDaLIR": "Retrieve documents that are referenced by the given text.",
121
- "MLSUMClusteringP2P": "Classify the topic of the given news article.",
122
- "SummEvalFr": "Given a news summary, retrieve other semantically similar summaries.",
123
- "AllegroReviews": "Classify the sentiment of the given text.",
124
- "CBD": "Classify the given text as either cyberbullying or not.",
125
- "PolEmo2.0-IN": "Classify the sentiment of the given text.",
126
- "PSC": "Retrieve semantically similar text.",
127
- "EcomRetrieval": "Given a product name query, retrieve the corresponding product description.",
128
- "MedicalRetrieval": "Retrieve the most relevant response for the given query.",
129
- "VideoRetrieval": "Given a video search query, retrieve the titles of relevant videos.",
130
- "CMedQAv1-reranking": "Retrieve the most relevant response for the given query.",
131
- "Waimai": "Classify the sentiment of the given review as either positive or negative.",
132
- "OnlineShopping": "Classify the sentiment of the given review as either positive or negative.",
133
- "JDReview": "Classify the sentiment of the given review as either positive or negative.",
134
- "MultilingualSentiment": "Classify the sentiment of the given review as either positive, negative, or neutral.",
135
- "ToxicChatClassification": "Classify the given text as either toxic or not toxic.",
136
- "JapaneseSentimentClassification": "Classify the sentiment of the given text.",
137
- "WRIMEClassification": "Classify the sentiment of the given text.",
138
- "NLPJournalTitleAbsRetrieval.V2": "Given a paper's title, retrieve the corresponding abstract.",
139
- "NLPJournalTitleIntroRetrieval.V2": "Given a paper's title, retrieve the corresponding introduction.",
140
- "NLPJournalAbsIntroRetrieval.V2": "Given a paper's abstract, retrieve the corresponding introduction.",
141
- "NLPJournalAbsArticleRetrieval.V2": "Given a paper's abstract, retrieve the corresponding paper.",
142
- "ESCIReranking": "Given a product name query, retrieve the corresponding product description.",
143
- "DutchBookReviewSentimentClassification.v2": "Classify the sentiment of the given text.",
144
- "VaccinChatNLClassification": "Classify the intent of the given utterance.",
145
- "DutchColaClassification": "Classify the given sentence as linguistically acceptable or not acceptable.",
146
- "DutchGovernmentBiasClassification": "Classify the given government document as biased or unbiased.",
147
- "DutchSarcasticHeadlinesClassification": "Classify the given newspaper headline as sarcastic or not sarcastic.",
148
- "XLWICNLPairClassification": "Retrieve semantically similar text.",
149
- "CovidDisinformationNLMultiLabelClassification": "Classify the given social media post related to COVID-19 into its misinformation category.",
150
- "VABBClusteringS2S": "Identify the main category of the given paper based on the title.",
151
- "VABBClusteringP2P": "Identify the main category of the given paper based on the title and abstract.",
152
- "ArguAna-NL.v2": "Given a claim, find documents that refute the claim.",
153
- "SCIDOCS-NL.v2": "Given a scientific paper title, retrieve paper abstracts that are cited by the given paper.",
154
- "SciFact-NL.v2": "Given a scientific claim, retrieve passages that support or refute the claim.",
155
- "DutchNewsArticlesRetrieval": "Given a news title, retrieve the original article.",
156
- "OpenTenderRetrieval": "Given a title, retrieve the corresponding article.",
157
- "VABBRetrieval": "Given a paper's title, retrieve the corresponding abstract.",
158
- "GeoreviewClassification": "Classify the given review into its appropriate rating category.",
159
- "InappropriatenessClassification": "Classify the given message as either sensitive topic or not.",
160
- "KinopoiskClassification": "Classify the sentiment of the given movie review.",
161
- "RuReviewsClassification": "Classify the sentiment of the given review as either positive, negative, or neutral.",
162
- "RuSciBenchGRNTIClassification": "Identify the main category of the given paper based on the title and abstract.",
163
- "RuSciBenchOECDClassification": "Identify the main category of the given paper based on the title and abstract.",
164
- "GeoreviewClusteringP2P": "Identify the organization category based on the given review.",
165
- "RuSciBenchGRNTIClusteringP2P": "Identify the main category of the given paper based on the title and abstract.",
166
- "RuSciBenchOECDClusteringP2P": "Identify the main category of the given paper based on the title and abstract.",
167
- "SensitiveTopicsClassification": "Classify the given text into sensitive topics.",
168
- "RiaNewsRetrievalHardNegatives.v2": "Given a news title, retrieve the original article.",
169
- "PersianFoodSentimentClassification": "Classify the sentiment of the given text as either positive or negative.",
170
- "SynPerChatbotConvSAClassification": "Classify the sentiment of the given text.",
171
- "SynPerChatbotConvSAToneChatbotClassification": "Classify the sentiment of the given text.",
172
- "SynPerChatbotConvSAToneUserClassification": "Classify the sentiment of the given text.",
173
- "SynPerChatbotSatisfactionLevelClassification": "Classify the satisfaction level of the given text.",
174
- "SynPerTextToneClassification.v3": "Classify the tone of the given text.",
175
- "DeepSentiPers.v2": "Classify the sentiment of the given text.",
176
- "PersianTextEmotion.v2": "Classify the emotion expressed in the given text into: joy, sadness, surprise, fear, anger, and love.",
177
- "StyleClassification": "Classify the style of the given text as either formal or informal.",
178
- "PerShopDomainClassification": "Classify the domain of the given utterance in shopping dialogue.",
179
- "PerShopIntentClassification": "Classify the intent of the given utterance in shopping dialogue.",
180
- "SynPerChatbotRAGFAQPC": "Retrieve the most relevant response for the given query.",
181
- "FarsiParaphraseDetection": "Retrieve semantically similar text.",
182
- "SynPerTextKeywordsPC": "Identify keywords in the given text.",
183
- "SynPerQAPC": "Retrieve the most relevant response for the given query.",
184
- "ParsinluQueryParaphPC": "Retrieve semantically similar text.",
185
- "SynPerChatbotRAGFAQRetrieval": "Retrieve the most relevant response for the given query.",
186
- "HotpotQA-FaHardNegatives": "Given a multi-hop question, retrieve passages that answer the question.",
187
- "ArguAna-Fa.v2": "Given a claim, find documents that refute the claim.",
188
- "QuoraRetrieval-Fa.v2": "Retrieve questions that are semantically equivalent to the given one.",
189
- "SCIDOCS-Fa.v2": "Given a scientific paper title, retrieve paper abstracts that are cited by the given paper.",
190
- "SciFact-Fa.v2": "Given a scientific claim, retrieve passages that support or refute the claim.",
191
- "TRECCOVID-Fa.v2": "Given a query on COVID-19, retrieve documents that answer the query.",
192
- "FEVER-FaHardNegatives": "Given a claim, retrieve documents that support or refute the claim.",
193
- "SAMSumFa": "Retrieve the most relevant summary for the given conversation.",
194
- "SynPerChatbotSumSRetrieval": "Retrieve the most relevant summary for the given conversation.",
195
- "SynPerChatbotRAGSumSRetrieval": "Retrieve the most relevant summary for the given conversation.",
196
- "ArguAna-VN": "Given a claim, find documents that refute the claim.",
197
- "SciFact-VN": "Given a scientific claim, retrieve passages that support or refute the claim.",
198
- "ClimateFEVER-VN": "Given a claim about climate change, retrieve documents that support or refute the claim.",
199
- "FEVER-VN": "Given a claim, retrieve documents that support or refute the claim.",
200
- "DBPedia-VN": "Given a query, retrieve relevant entity descriptions.",
201
- "HotpotQA-VN": "Given a multi-hop question, retrieve passages that answer the question.",
202
- "TRECCOVID-VN": "Given a query on COVID-19, retrieve documents that answer the query.",
203
- "SCIDOCS-VN": "Given a scientific paper title, retrieve paper abstracts that are cited by the given paper.",
204
- "Quora-VN": "Retrieve questions that are semantically equivalent to the given one.",
205
- "CQADupstackAndroid-VN": "Given a question, retrieve questions that are semantically equivalent.",
206
- "CQADupstackGis-VN": "Given a question, retrieve questions that are semantically equivalent.",
207
- "CQADupstackMathematica-VN": "Given a question, retrieve questions that are semantically equivalent.",
208
- "CQADupstackPhysics-VN": "Given a question, retrieve questions that are semantically equivalent.",
209
- "CQADupstackProgrammers-VN": "Given a question, retrieve questions that are semantically equivalent.",
210
- "CQADupstackStats-VN": "Given a question, retrieve questions that are semantically equivalent.",
211
- "CQADupstackTex-VN": "Given a question, retrieve questions that are semantically equivalent.",
212
- "CQADupstackUnix-VN": "Given a question, retrieve questions that are semantically equivalent.",
213
- "CQADupstackWebmasters-VN": "Given a question, retrieve questions that are semantically equivalent.",
214
- "CQADupstackWordpress-VN": "Given a question, retrieve questions that are semantically equivalent.",
215
- "Banking77VNClassification": "Given an online banking query, find the corresponding intents.",
216
- "EmotionVNClassification": "Classify the emotion expressed in the given Twitter message into one of the six emotions: anger, fear, joy, love, sadness, and surprise.",
217
- "AmazonCounterfactualVNClassification": "Classify a given Amazon customer review text as either counterfactual or not counterfactual.",
218
- "MTOPDomainVNClassification": "Classify the intent domain of the given utterance in task-oriented conversation.",
219
- "TweetSentimentExtractionVNClassification": "Classify the sentiment of a given tweet as either positive, negative, or neutral",
220
- "ToxicConversationsVNClassification": "Classify the given comments as either toxic or not toxic.",
221
- "ImdbVNClassification": "Classify the sentiment expressed in the given movie review text from the IMDB dataset.",
222
- "MTOPIntentVNClassification": "Classify the intent of the given utterance in task-oriented conversation.",
223
- "MassiveScenarioVNClassification": "Given a user utterance as query, find the user scenarios.",
224
- "MassiveIntentVNClassification": "Given a user utterance as query, find the user intents.",
225
- "AmazonReviewsVNClassification": "Classify the given Amazon review into its appropriate rating category.",
226
- "AmazonPolarityVNClassification": "Classify the given Amazon review as either positive or negative.",
227
- "SprintDuplicateQuestions-VN": "Retrieve duplicate questions from Sprint forum.",
228
- "TwitterSemEval2015-VN": "Retrieve tweets that are semantically similar to the given tweet.",
229
- "TwitterURLCorpus-VN": "Retrieve tweets that are semantically similar to the given tweet.",
230
- "TwentyNewsgroupsClustering-VN": "Identify the topic or theme of the given news articles.",
231
- "RedditClusteringP2P-VN": "Identify the topic or theme of Reddit posts based on the titles and posts.",
232
- "StackExchangeClusteringP2P-VN": "Identify the topic or theme of StackExchange posts based on the given titles and paragraphs.",
233
- "StackExchangeClustering-VN": "Identify the topic or theme of StackExchange posts based on the titles.",
234
- "RedditClustering-VN": "Identify the topic or theme of Reddit posts based on the titles.",
235
- "SciDocsRR-VN": "Given a title of a scientific paper, retrieve the titles of other relevant papers.",
236
- "AskUbuntuDupQuestions-VN": "Retrieve duplicate questions from AskUbuntu forum.",
237
- "StackOverflowDupQuestions-VN": "Retrieve duplicate questions from StackOverflow forum."
238
- },
239
- "default_prompt_name": null,
240
- "similarity_fn_name": "cosine"
241
- }
 
1
  {
2
+ "prompts": {
3
+ "query": "Instruct: Given a question, retrieve passages that can help answer the question.\nQuery: ",
4
+ "document": ""
5
+ },
6
+ "default_prompt_name": null,
7
+ "similarity_fn_name": "cosine"
8
+ }