Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Gregor Betz
committed on
tasks
Browse files - src/display/about.py +14 -2
src/display/about.py
CHANGED
|
@@ -11,8 +11,19 @@ class Task:
|
|
| 11 |
# Init: to update with your specific keys
|
| 12 |
class Tasks(Enum):
|
| 13 |
# task_key in the json file, metric_key in the json file, name to display in the leaderboard
|
| 14 |
-
task0 = Task("
|
| 15 |
-
task1 = Task("
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 16 |
|
| 17 |
|
| 18 |
# Your leaderboard name
|
|
@@ -46,6 +57,7 @@ prompts = [
|
|
| 46 |
]
|
| 47 |
sampling_params = SamplingParams(temperature=0.8, top_p=0.95)
|
| 48 |
llm = LLM(model="<USER>/<MODEL>")
|
|
|
|
| 49 |
```
|
| 50 |
If this step fails, follow the error messages to debug your model before submitting it. It's likely your model has been improperly uploaded.
|
| 51 |
|
|
|
|
| 11 |
# Init: to update with your specific keys
|
| 12 |
class Tasks(Enum):
|
| 13 |
# task_key in the json file, metric_key in the json file, name to display in the leaderboard
|
| 14 |
+
task0 = Task("logiqa_delta_abs", "delta_abs", "LogiQA Δ")
|
| 15 |
+
task1 = Task("logiqa_delta_rel", "delta_rel", "LogiQA Δ%")
|
| 16 |
+
task2 = Task("logiqa_acc_base", "acc_base", "LogiQA Acc")
|
| 17 |
+
task3 = Task("logiqa_acc_cot", "acc_cot", "LogiQA AccCoT")
|
| 18 |
+
task4 = Task("logiqa2_delta_abs", "delta_abs", "LogiQA2 Δ")
|
| 19 |
+
task5 = Task("logiqa2_delta_rel", "delta_rel", "LogiQA2 Δ%")
|
| 20 |
+
task6 = Task("logiqa2_acc_base", "acc_base", "LogiQA2 Acc")
|
| 21 |
+
task7 = Task("logiqa2_acc_cot", "acc_cot", "LogiQA2 AccCoT")
|
| 22 |
+
|
| 23 |
+
|
| 24 |
+
|
| 25 |
+
|
| 26 |
+
|
| 27 |
|
| 28 |
|
| 29 |
# Your leaderboard name
|
|
|
|
| 57 |
]
|
| 58 |
sampling_params = SamplingParams(temperature=0.8, top_p=0.95)
|
| 59 |
llm = LLM(model="<USER>/<MODEL>")
|
| 60 |
+
outputs = llm.generate(prompts, sampling_params)
|
| 61 |
```
|
| 62 |
If this step fails, follow the error messages to debug your model before submitting it. It's likely your model has been improperly uploaded.
|
| 63 |
|