Sfarzi committed on
Commit
5bbb459
·
1 Parent(s): e6c5ca5

Initial clone with modifications

Browse files
src/__pycache__/tasks.cpython-310.pyc CHANGED
Binary files a/src/__pycache__/tasks.cpython-310.pyc and b/src/__pycache__/tasks.cpython-310.pyc differ
 
src/about.py CHANGED
@@ -139,8 +139,8 @@ TITLE = """<h1 align="center" id="space-title">🚀 ECREAM-LLM Leaderboard 🚀<
139
  # What does your leaderboard evaluate?
140
  INTRODUCTION_TEXT = """
141
  <br><br><b>The eCream-LLM leaderboard </b>, developed within <a href='https://ecreamproject.eu/'> the eCream Project </a> (enabling Clinical Research in Emergency and Acute care Medicine), is designed to evaluate Large Language Models (LLMs) on several tasks pertaining to the medical domain. Its distinguishing features are:<b> <br> (i) all tasks are implemented for six languages including English, Italian, Slovak, Slovenian, Polish and Greek; <br> (ii) the leaderboard includes generative tasks, allowing for a more natural interaction with LLMs; <br> (iii) all tasks are evaluated against multiple prompts, this way mitigating the model sensitivity to specific prompts and allowing a fairer evaluation.</b>
142
- <br><br>**<small>Generative tasks:</small>** <small> 🏷️NER (Named Entity Recognition), 🔗REL (Relation Extraction), 😃RML(CRF RML) </small>
143
- <br>**<small>Multiple-choice task:</small>** <small> 🏥DIA (CRF Diagnosis), 📝HIS (CRF History) </small>
144
 
145
  """
146
 
 
139
  # What does your leaderboard evaluate?
140
  INTRODUCTION_TEXT = """
141
  <br><br><b>The eCream-LLM leaderboard </b>, developed within <a href='https://ecreamproject.eu/'> the eCream Project </a> (enabling Clinical Research in Emergency and Acute care Medicine), is designed to evaluate Large Language Models (LLMs) on several tasks pertaining to the medical domain. Its distinguishing features are:<b> <br> (i) all tasks are implemented for six languages including English, Italian, Slovak, Slovenian, Polish and Greek; <br> (ii) the leaderboard includes generative tasks, allowing for a more natural interaction with LLMs; <br> (iii) all tasks are evaluated against multiple prompts, this way mitigating the model sensitivity to specific prompts and allowing a fairer evaluation.</b>
142
+ <br><br>**<small>Generative tasks:</small>** <small> 🏷️NER-E3C (Named Entity Recognition - E3C), 🔗REL-E3C (Relation Extraction -E3C), 😃CRF-RML(CRF RML), NER-PHA ( Named Entity Recognition - PharamaER.IT) </small>
143
+ <br>**<small>Multiple-choice task:</small>** <small> 🏥CRF-DIA (CRF Diagnosis), 📝CRF-HIS (CRF History) </small>
144
 
145
  """
146
 
src/tasks.py CHANGED
@@ -254,15 +254,15 @@ NER_PHARMAER_DESCRIPTION = """### Named Entity Recognition over (NER) over Pha
254
 
255
  # Create a dictionary to map task names to their descriptions
256
  TASK_DESCRIPTIONS = {
257
- "RML-CRF": RML_DESCRIPTION,
258
- "DIA-CRF": DIA_DESCRIPTION,
259
- "HIS-CRF": HIS_DESCRIPTION,
260
  "AT": AT_DESCRIPTION,
261
  "WIC": WIC_DESCRIPTION,
262
  "FAQ": FAQ_DESCRIPTION,
263
  "LS": LS_DESCRIPTION,
264
  "SU": SU_DESCRIPTION,
265
- "NER": NER_DESCRIPTION,
266
- "REL": REL_DESCRIPTION,
267
- "NER-PHARMAER": NER_PHARMAER_DESCRIPTION,
268
  }
 
254
 
255
  # Create a dictionary to map task names to their descriptions
256
  TASK_DESCRIPTIONS = {
257
+ "CRF-RML": RML_DESCRIPTION,
258
+ "CRF-DIA": DIA_DESCRIPTION,
259
+ "CRF-HIS": HIS_DESCRIPTION,
260
  "AT": AT_DESCRIPTION,
261
  "WIC": WIC_DESCRIPTION,
262
  "FAQ": FAQ_DESCRIPTION,
263
  "LS": LS_DESCRIPTION,
264
  "SU": SU_DESCRIPTION,
265
+ "NER-E3C": NER_DESCRIPTION,
266
+ "REL-E3C": REL_DESCRIPTION,
267
+ "NER-PHA": NER_PHARMAER_DESCRIPTION,
268
  }