Initial clone with modifications
Browse files
- src/__pycache__/tasks.cpython-310.pyc +0 -0
- src/about.py +2 -2
- src/tasks.py +6 -6
src/__pycache__/tasks.cpython-310.pyc
CHANGED
|
Binary files a/src/__pycache__/tasks.cpython-310.pyc and b/src/__pycache__/tasks.cpython-310.pyc differ
|
|
|
src/about.py
CHANGED
|
@@ -139,8 +139,8 @@ TITLE = """<h1 align="center" id="space-title">๐ ECREAM-LLM Leaderboard ๐<
|
|
| 139 |
# What does your leaderboard evaluate?
|
| 140 |
INTRODUCTION_TEXT = """
|
| 141 |
<br><br><b>The eCream-LLM leaderboard </b>, developed within <a href='https://ecreamproject.eu/'> the eCream Project </a> (enabling Clinical Research in Emergency and Acute care Medicine), is designed to evaluate Large Language Models (LLMs) on several tasks pertaining to the medical domain. Its distinguishing features are:<b> <br> (i) all tasks are implemented for six languages including English, Italian, Slovak, Slovenian, Polish and Greek; <br> (ii) the leaderboard includes generative tasks, allowing for a more natural interaction with LLMs; <br> (iii) all tasks are evaluated against multiple prompts, this way mitigating the model sensitivity to specific prompts and allowing a fairer evaluation.</b>
|
| 142 |
-
<br><br>**<small>Generative tasks:</small>** <small> 🏷️NER (Named Entity Recognition), ๐REL (Relation Extraction), ๐RML(CRF RML) </small>
|
| 143 |
-
<br>**<small>Multiple-choice task:</small>** <small> ๐ฅDIA (CRF Diagnosis), ๐HIS (CRF History) </small>
|
| 144 |
|
| 145 |
"""
|
| 146 |
|
|
|
|
| 139 |
# What does your leaderboard evaluate?
|
| 140 |
INTRODUCTION_TEXT = """
|
| 141 |
<br><br><b>The eCream-LLM leaderboard </b>, developed within <a href='https://ecreamproject.eu/'> the eCream Project </a> (enabling Clinical Research in Emergency and Acute care Medicine), is designed to evaluate Large Language Models (LLMs) on several tasks pertaining to the medical domain. Its distinguishing features are:<b> <br> (i) all tasks are implemented for six languages including English, Italian, Slovak, Slovenian, Polish and Greek; <br> (ii) the leaderboard includes generative tasks, allowing for a more natural interaction with LLMs; <br> (iii) all tasks are evaluated against multiple prompts, this way mitigating the model sensitivity to specific prompts and allowing a fairer evaluation.</b>
|
| 142 |
+
<br><br>**<small>Generative tasks:</small>** <small> 🏷️NER-E3C (Named Entity Recognition - E3C), ๐REL-E3C (Relation Extraction - E3C), ๐CRF-RML(CRF RML), NER-PHA (Named Entity Recognition - PharmaER.IT) </small>
|
| 143 |
+
<br>**<small>Multiple-choice task:</small>** <small> ๐ฅCRF-DIA (CRF Diagnosis), ๐CRF-HIS (CRF History) </small>
|
| 144 |
|
| 145 |
"""
|
| 146 |
|
src/tasks.py
CHANGED
|
@@ -254,15 +254,15 @@ NER_PHARMAER_DESCRIPTION = """### Named Entity Recognition over (NER) over Pha
|
|
| 254 |
|
| 255 |
# Create a dictionary to map task names to their descriptions
|
| 256 |
TASK_DESCRIPTIONS = {
|
| 257 |
-
"RML": RML_DESCRIPTION,
|
| 258 |
-
"DIA": DIA_DESCRIPTION,
|
| 259 |
-
"HIS": HIS_DESCRIPTION,
|
| 260 |
"AT": AT_DESCRIPTION,
|
| 261 |
"WIC": WIC_DESCRIPTION,
|
| 262 |
"FAQ": FAQ_DESCRIPTION,
|
| 263 |
"LS": LS_DESCRIPTION,
|
| 264 |
"SU": SU_DESCRIPTION,
|
| 265 |
-
"NER": NER_DESCRIPTION,
|
| 266 |
-
"REL": REL_DESCRIPTION,
|
| 267 |
-
"NER-
|
| 268 |
}
|
|
|
|
| 254 |
|
| 255 |
# Create a dictionary to map task names to their descriptions
|
| 256 |
TASK_DESCRIPTIONS = {
|
| 257 |
+
"CRF-RML": RML_DESCRIPTION,
|
| 258 |
+
"CRF-DIA": DIA_DESCRIPTION,
|
| 259 |
+
"CRF-HIS": HIS_DESCRIPTION,
|
| 260 |
"AT": AT_DESCRIPTION,
|
| 261 |
"WIC": WIC_DESCRIPTION,
|
| 262 |
"FAQ": FAQ_DESCRIPTION,
|
| 263 |
"LS": LS_DESCRIPTION,
|
| 264 |
"SU": SU_DESCRIPTION,
|
| 265 |
+
"NER-E3C": NER_DESCRIPTION,
|
| 266 |
+
"REL-E3C": REL_DESCRIPTION,
|
| 267 |
+
"NER-PHA": NER_PHARMAER_DESCRIPTION,
|
| 268 |
}
|