Commit
·
4f27e41
1
Parent(s):
0495bc2
style: Re-order
Browse files
app.py
CHANGED
|
@@ -160,13 +160,13 @@ class Dataset(BaseModel):
|
|
| 160 |
return hash(self.name)
|
| 161 |
|
| 162 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 163 |
SUMMARISATION = Task(name="summarisation", metric="bertscore")
|
| 164 |
KNOWLEDGE = Task(name="knowledge", metric="mcc")
|
| 165 |
COMMON_SENSE_REASONING = Task(name="common-sense reasoning", metric="mcc")
|
| 166 |
-
GRAMMAR = Task(name="grammar", metric="mcc")
|
| 167 |
-
READING_COMPREHENSION = Task(name="reading comprehension", metric="em")
|
| 168 |
-
TEXT_CLASSIFICATION = Task(name="text classification", metric="mcc")
|
| 169 |
-
INFORMATION_EXTRACTION = Task(name="information extraction", metric="micro_f1_no_misc")
|
| 170 |
ALL_TASKS = [obj for obj in globals().values() if isinstance(obj, Task)]
|
| 171 |
|
| 172 |
DANISH = Language(code="da", name="Danish")
|
|
@@ -184,82 +184,87 @@ ALL_LANGUAGES = {
|
|
| 184 |
}
|
| 185 |
|
| 186 |
DATASETS = [
|
| 187 |
-
Dataset(name="swerec", language=SWEDISH, task=TEXT_CLASSIFICATION),
|
| 188 |
Dataset(name="angry-tweets", language=DANISH, task=TEXT_CLASSIFICATION),
|
| 189 |
-
Dataset(name="
|
| 190 |
-
Dataset(name="sb10k", language=GERMAN, task=TEXT_CLASSIFICATION),
|
| 191 |
-
Dataset(name="dutch-social", language=DUTCH, task=TEXT_CLASSIFICATION),
|
| 192 |
-
Dataset(name="sst5", language=ENGLISH, task=TEXT_CLASSIFICATION),
|
| 193 |
-
Dataset(name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION),
|
| 194 |
-
Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
|
| 195 |
-
Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
|
| 196 |
-
Dataset(name="sentipolc16", language=ITALIAN, task=TEXT_CLASSIFICATION),
|
| 197 |
-
|
| 198 |
-
Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
|
| 199 |
Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
|
| 200 |
-
Dataset(name="
|
| 201 |
-
Dataset(name="
|
| 202 |
-
Dataset(name="
|
| 203 |
-
Dataset(name="
|
| 204 |
-
Dataset(name="
|
| 205 |
-
Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
|
| 206 |
-
Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
|
| 207 |
-
Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
|
| 208 |
-
Dataset(name="multinerd-it", language=ITALIAN, task=INFORMATION_EXTRACTION),
|
| 209 |
|
| 210 |
-
Dataset(name="
|
| 211 |
-
Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
|
| 212 |
-
Dataset(name="scala-nb", language=NORWEGIAN, task=GRAMMAR),
|
| 213 |
-
Dataset(name="scala-nn", language=NORWEGIAN, task=GRAMMAR),
|
| 214 |
-
Dataset(name="scala-is", language=ICELANDIC, task=GRAMMAR),
|
| 215 |
-
Dataset(name="scala-de", language=GERMAN, task=GRAMMAR),
|
| 216 |
Dataset(name="scala-nl", language=DUTCH, task=GRAMMAR),
|
| 217 |
-
Dataset(name="
|
| 218 |
-
Dataset(name="
|
| 219 |
-
Dataset(name="
|
| 220 |
-
Dataset(name="
|
|
|
|
| 221 |
|
| 222 |
-
Dataset(name="
|
| 223 |
-
Dataset(name="
|
| 224 |
-
Dataset(name="
|
| 225 |
-
Dataset(name="nqii", language=ICELANDIC, task=READING_COMPREHENSION),
|
| 226 |
-
Dataset(name="germanquad", language=GERMAN, task=READING_COMPREHENSION),
|
| 227 |
Dataset(name="squad", language=ENGLISH, task=READING_COMPREHENSION),
|
| 228 |
-
Dataset(name="
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 229 |
Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
|
|
|
|
|
|
|
|
|
|
|
|
|
| 230 |
Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
|
| 231 |
-
Dataset(name="
|
|
|
|
|
|
|
| 232 |
|
| 233 |
-
Dataset(name="
|
|
|
|
|
|
|
|
|
|
| 234 |
Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
|
| 235 |
-
Dataset(name="
|
| 236 |
-
Dataset(name="
|
| 237 |
-
Dataset(name="wiki-lingua-nl", language=DUTCH, task=SUMMARISATION),
|
| 238 |
-
Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
|
| 239 |
-
Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
|
| 240 |
-
Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
|
| 241 |
-
Dataset(name="ilpost-sum", language=ITALIAN, task=SUMMARISATION),
|
| 242 |
|
| 243 |
-
Dataset(
|
| 244 |
-
|
| 245 |
-
|
| 246 |
-
Dataset(name="
|
|
|
|
|
|
|
|
|
|
| 247 |
Dataset(name="icelandic-knowledge", language=ICELANDIC, task=KNOWLEDGE),
|
| 248 |
-
Dataset(name="
|
| 249 |
-
|
| 250 |
-
Dataset(name="
|
| 251 |
-
Dataset(name="
|
|
|
|
|
|
|
|
|
|
| 252 |
Dataset(name="mmlu-it", language=ITALIAN, task=KNOWLEDGE),
|
|
|
|
| 253 |
|
| 254 |
-
Dataset(name="
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 255 |
Dataset(name="nor-common-sense-qa", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 256 |
Dataset(name="hellaswag-sv", language=SWEDISH, task=COMMON_SENSE_REASONING),
|
| 257 |
-
Dataset(name="winogrande-is", language=ICELANDIC, task=COMMON_SENSE_REASONING),
|
| 258 |
-
Dataset(name="hellaswag-de", language=GERMAN, task=COMMON_SENSE_REASONING),
|
| 259 |
-
Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
|
| 260 |
-
Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
|
| 261 |
-
Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
|
| 262 |
-
Dataset(name="hellaswag-it", language=ITALIAN, task=COMMON_SENSE_REASONING),
|
| 263 |
]
|
| 264 |
|
| 265 |
|
|
|
|
| 160 |
return hash(self.name)
|
| 161 |
|
| 162 |
|
| 163 |
+
TEXT_CLASSIFICATION = Task(name="text classification", metric="mcc")
|
| 164 |
+
GRAMMAR = Task(name="grammar", metric="mcc")
|
| 165 |
+
INFORMATION_EXTRACTION = Task(name="information extraction", metric="micro_f1_no_misc")
|
| 166 |
+
READING_COMPREHENSION = Task(name="reading comprehension", metric="em")
|
| 167 |
SUMMARISATION = Task(name="summarisation", metric="bertscore")
|
| 168 |
KNOWLEDGE = Task(name="knowledge", metric="mcc")
|
| 169 |
COMMON_SENSE_REASONING = Task(name="common-sense reasoning", metric="mcc")
|
|
|
|
|
|
|
|
|
|
|
|
|
| 170 |
ALL_TASKS = [obj for obj in globals().values() if isinstance(obj, Task)]
|
| 171 |
|
| 172 |
DANISH = Language(code="da", name="Danish")
|
|
|
|
| 184 |
}
|
| 185 |
|
| 186 |
DATASETS = [
|
|
|
|
| 187 |
Dataset(name="angry-tweets", language=DANISH, task=TEXT_CLASSIFICATION),
|
| 188 |
+
Dataset(name="scala-da", language=DANISH, task=GRAMMAR),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 189 |
Dataset(name="dansk", language=DANISH, task=INFORMATION_EXTRACTION),
|
| 190 |
+
Dataset(name="scandiqa-da", language=DANISH, task=READING_COMPREHENSION),
|
| 191 |
+
Dataset(name="nordjylland-news", language=DANISH, task=SUMMARISATION),
|
| 192 |
+
Dataset(name="danish-citizen-tests", language=DANISH, task=KNOWLEDGE),
|
| 193 |
+
Dataset(name="danske-talemaader", language=DANISH, task=KNOWLEDGE),
|
| 194 |
+
Dataset(name="hellaswag-da", language=DANISH, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
|
|
|
|
| 195 |
|
| 196 |
+
Dataset(name="dutch-social", language=DUTCH, task=TEXT_CLASSIFICATION),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 197 |
Dataset(name="scala-nl", language=DUTCH, task=GRAMMAR),
|
| 198 |
+
Dataset(name="conll-nl", language=DUTCH, task=INFORMATION_EXTRACTION),
|
| 199 |
+
Dataset(name="squad-nl", language=DUTCH, task=READING_COMPREHENSION),
|
| 200 |
+
Dataset(name="wiki-lingua-nl", language=DUTCH, task=SUMMARISATION),
|
| 201 |
+
Dataset(name="mmlu-nl", language=DUTCH, task=KNOWLEDGE),
|
| 202 |
+
Dataset(name="hellaswag-nl", language=DUTCH, task=COMMON_SENSE_REASONING),
|
| 203 |
|
| 204 |
+
Dataset(name="sst5", language=ENGLISH, task=TEXT_CLASSIFICATION),
|
| 205 |
+
Dataset(name="scala-en", language=ENGLISH, task=GRAMMAR),
|
| 206 |
+
Dataset(name="conll-en", language=ENGLISH, task=INFORMATION_EXTRACTION),
|
|
|
|
|
|
|
| 207 |
Dataset(name="squad", language=ENGLISH, task=READING_COMPREHENSION),
|
| 208 |
+
Dataset(name="cnn-dailymail", language=ENGLISH, task=SUMMARISATION),
|
| 209 |
+
Dataset(name="mmlu", language=ENGLISH, task=KNOWLEDGE),
|
| 210 |
+
Dataset(name="hellaswag", language=ENGLISH, task=COMMON_SENSE_REASONING),
|
| 211 |
+
|
| 212 |
+
Dataset(name="fosent", language=FAROESE, task=TEXT_CLASSIFICATION),
|
| 213 |
+
Dataset(name="scala-fo", language=FAROESE, task=GRAMMAR),
|
| 214 |
+
Dataset(name="fone", language=FAROESE, task=INFORMATION_EXTRACTION),
|
| 215 |
Dataset(name="foqa", language=FAROESE, task=READING_COMPREHENSION),
|
| 216 |
+
|
| 217 |
+
Dataset(name="allocine", language=FRENCH, task=TEXT_CLASSIFICATION),
|
| 218 |
+
Dataset(name="scala-fr", language=FRENCH, task=GRAMMAR),
|
| 219 |
+
Dataset(name="eltec", language=FRENCH, task=INFORMATION_EXTRACTION),
|
| 220 |
Dataset(name="fquad", language=FRENCH, task=READING_COMPREHENSION),
|
| 221 |
+
Dataset(name="orange-sum", language=FRENCH, task=SUMMARISATION),
|
| 222 |
+
Dataset(name="mmlu-fr", language=FRENCH, task=KNOWLEDGE),
|
| 223 |
+
Dataset(name="hellaswag-fr", language=FRENCH, task=COMMON_SENSE_REASONING),
|
| 224 |
|
| 225 |
+
Dataset(name="sb10k", language=GERMAN, task=TEXT_CLASSIFICATION),
|
| 226 |
+
Dataset(name="scala-de", language=GERMAN, task=GRAMMAR),
|
| 227 |
+
Dataset(name="germeval", language=GERMAN, task=INFORMATION_EXTRACTION),
|
| 228 |
+
Dataset(name="germanquad", language=GERMAN, task=READING_COMPREHENSION),
|
| 229 |
Dataset(name="mlsum", language=GERMAN, task=SUMMARISATION),
|
| 230 |
+
Dataset(name="mmlu-de", language=GERMAN, task=KNOWLEDGE),
|
| 231 |
+
Dataset(name="hellaswag-de", language=GERMAN, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 232 |
|
| 233 |
+
Dataset(
|
| 234 |
+
name="hotter-and-colder-sentiment", language=ICELANDIC, task=TEXT_CLASSIFICATION
|
| 235 |
+
),
|
| 236 |
+
Dataset(name="scala-is", language=ICELANDIC, task=GRAMMAR),
|
| 237 |
+
Dataset(name="mim-gold-ner", language=ICELANDIC, task=INFORMATION_EXTRACTION),
|
| 238 |
+
Dataset(name="nqii", language=ICELANDIC, task=READING_COMPREHENSION),
|
| 239 |
+
Dataset(name="rrn", language=ICELANDIC, task=SUMMARISATION),
|
| 240 |
Dataset(name="icelandic-knowledge", language=ICELANDIC, task=KNOWLEDGE),
|
| 241 |
+
Dataset(name="winogrande-is", language=ICELANDIC, task=COMMON_SENSE_REASONING),
|
| 242 |
+
|
| 243 |
+
Dataset(name="sentipolc16", language=ITALIAN, task=TEXT_CLASSIFICATION),
|
| 244 |
+
Dataset(name="scala-it", language=ITALIAN, task=GRAMMAR),
|
| 245 |
+
Dataset(name="multinerd-it", language=ITALIAN, task=INFORMATION_EXTRACTION),
|
| 246 |
+
Dataset(name="squad-it", language=ITALIAN, task=READING_COMPREHENSION),
|
| 247 |
+
Dataset(name="ilpost-sum", language=ITALIAN, task=SUMMARISATION),
|
| 248 |
Dataset(name="mmlu-it", language=ITALIAN, task=KNOWLEDGE),
|
| 249 |
+
Dataset(name="hellaswag-it", language=ITALIAN, task=COMMON_SENSE_REASONING),
|
| 250 |
|
| 251 |
+
Dataset(name="norec", language=NORWEGIAN, task=TEXT_CLASSIFICATION),
|
| 252 |
+
Dataset(name="scala-nb", language=NORWEGIAN, task=GRAMMAR),
|
| 253 |
+
Dataset(name="scala-nn", language=NORWEGIAN, task=GRAMMAR),
|
| 254 |
+
Dataset(name="norne-nb", language=NORWEGIAN, task=INFORMATION_EXTRACTION),
|
| 255 |
+
Dataset(name="norne-nn", language=NORWEGIAN, task=INFORMATION_EXTRACTION),
|
| 256 |
+
Dataset(name="norquad", language=NORWEGIAN, task=READING_COMPREHENSION),
|
| 257 |
+
Dataset(name="no-sammendrag", language=NORWEGIAN, task=SUMMARISATION),
|
| 258 |
+
Dataset(name="nrk-quiz-qa", language=NORWEGIAN, task=KNOWLEDGE),
|
| 259 |
Dataset(name="nor-common-sense-qa", language=NORWEGIAN, task=COMMON_SENSE_REASONING),
|
| 260 |
+
|
| 261 |
+
Dataset(name="swerec", language=SWEDISH, task=TEXT_CLASSIFICATION),
|
| 262 |
+
Dataset(name="scala-sv", language=SWEDISH, task=GRAMMAR),
|
| 263 |
+
Dataset(name="suc3", language=SWEDISH, task=INFORMATION_EXTRACTION),
|
| 264 |
+
Dataset(name="scandiqa-sv", language=SWEDISH, task=READING_COMPREHENSION),
|
| 265 |
+
Dataset(name="swedn", language=SWEDISH, task=SUMMARISATION),
|
| 266 |
+
Dataset(name="mmlu-sv", language=SWEDISH, task=KNOWLEDGE),
|
| 267 |
Dataset(name="hellaswag-sv", language=SWEDISH, task=COMMON_SENSE_REASONING),
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 268 |
]
|
| 269 |
|
| 270 |
|