Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Import constants as submodule
Browse files
- app.py +5 -5
- src/details.py +4 -4
- src/results.py +5 -5
app.py
CHANGED
|
@@ -2,7 +2,7 @@ from functools import partial
|
|
| 2 |
|
| 3 |
import gradio as gr
|
| 4 |
|
| 5 |
-
|
| 6 |
from src.details import update_subtasks_component, update_load_details_component, load_details_dataframes, \
|
| 7 |
display_details, update_sample_idx_component, clear_details, update_task_description_component
|
| 8 |
from src.results import update_load_results_component, \
|
|
@@ -34,7 +34,7 @@ with gr.Blocks(fill_height=True, fill_width=True) as demo:
|
|
| 34 |
load_results_btn = gr.Button("Load", interactive=False)
|
| 35 |
clear_results_btn = gr.Button("Clear")
|
| 36 |
results_task = gr.Radio(
|
| 37 |
-
["All"] + list(TASKS.values()),
|
| 38 |
label="Tasks",
|
| 39 |
info="Evaluation tasks to be displayed",
|
| 40 |
value="All",
|
|
@@ -50,7 +50,7 @@ with gr.Blocks(fill_height=True, fill_width=True) as demo:
|
|
| 50 |
load_configs_btn = gr.Button("Load", interactive=False)
|
| 51 |
clear_configs_btn = gr.Button("Clear")
|
| 52 |
configs_task = gr.Radio(
|
| 53 |
-
["All"] + list(TASKS.values()),
|
| 54 |
label="Tasks",
|
| 55 |
info="Evaluation tasks to be displayed",
|
| 56 |
value="All",
|
|
@@ -64,7 +64,7 @@ with gr.Blocks(fill_height=True, fill_width=True) as demo:
|
|
| 64 |
configs = gr.HTML()
|
| 65 |
with gr.Tab("Details"):
|
| 66 |
details_task = gr.Radio(
|
| 67 |
-
list(value for value in TASKS.values() if value[1] != "leaderboard_gpqa"),
|
| 68 |
label="Tasks",
|
| 69 |
info="Evaluation tasks to be loaded",
|
| 70 |
interactive=True,
|
|
@@ -74,7 +74,7 @@ with gr.Blocks(fill_height=True, fill_width=True) as demo:
|
|
| 74 |
lines=3,
|
| 75 |
)
|
| 76 |
subtask = gr.Radio(
|
| 77 |
-
SUBTASKS.get(details_task.value),
|
| 78 |
label="Subtasks",
|
| 79 |
info="Evaluation subtasks to be loaded (choose one of the Tasks above)",
|
| 80 |
)
|
|
|
|
| 2 |
|
| 3 |
import gradio as gr
|
| 4 |
|
| 5 |
+
import src.constants as constants
|
| 6 |
from src.details import update_subtasks_component, update_load_details_component, load_details_dataframes, \
|
| 7 |
display_details, update_sample_idx_component, clear_details, update_task_description_component
|
| 8 |
from src.results import update_load_results_component, \
|
|
|
|
| 34 |
load_results_btn = gr.Button("Load", interactive=False)
|
| 35 |
clear_results_btn = gr.Button("Clear")
|
| 36 |
results_task = gr.Radio(
|
| 37 |
+
["All"] + list(constants.TASKS.values()),
|
| 38 |
label="Tasks",
|
| 39 |
info="Evaluation tasks to be displayed",
|
| 40 |
value="All",
|
|
|
|
| 50 |
load_configs_btn = gr.Button("Load", interactive=False)
|
| 51 |
clear_configs_btn = gr.Button("Clear")
|
| 52 |
configs_task = gr.Radio(
|
| 53 |
+
["All"] + list(constants.TASKS.values()),
|
| 54 |
label="Tasks",
|
| 55 |
info="Evaluation tasks to be displayed",
|
| 56 |
value="All",
|
|
|
|
| 64 |
configs = gr.HTML()
|
| 65 |
with gr.Tab("Details"):
|
| 66 |
details_task = gr.Radio(
|
| 67 |
+
list(value for value in constants.TASKS.values() if value[1] != "leaderboard_gpqa"),
|
| 68 |
label="Tasks",
|
| 69 |
info="Evaluation tasks to be loaded",
|
| 70 |
interactive=True,
|
|
|
|
| 74 |
lines=3,
|
| 75 |
)
|
| 76 |
subtask = gr.Radio(
|
| 77 |
+
# constants.SUBTASKS.get(details_task.value),
|
| 78 |
label="Subtasks",
|
| 79 |
info="Evaluation subtasks to be loaded (choose one of the Tasks above)",
|
| 80 |
)
|
src/details.py
CHANGED
|
@@ -4,13 +4,13 @@ import gradio as gr
|
|
| 4 |
import pandas as pd
|
| 5 |
from huggingface_hub import HfFileSystem
|
| 6 |
|
| 7 |
-
|
| 8 |
from src.hub import load_details_file
|
| 9 |
|
| 10 |
|
| 11 |
def update_task_description_component(task):
|
| 12 |
return gr.Textbox(
|
| 13 |
-
TASK_DESCRIPTIONS.get(task),
|
| 14 |
label="Task Description",
|
| 15 |
lines=3,
|
| 16 |
visible=True,
|
|
@@ -19,7 +19,7 @@ def update_task_description_component(task):
|
|
| 19 |
|
| 20 |
def update_subtasks_component(task):
|
| 21 |
return gr.Radio(
|
| 22 |
-
SUBTASKS.get(task),
|
| 23 |
info="Evaluation subtasks to be loaded",
|
| 24 |
value=None,
|
| 25 |
)
|
|
@@ -38,7 +38,7 @@ async def load_details_dataframe(model_id, subtask):
|
|
| 38 |
return
|
| 39 |
model_name_sanitized = model_id.replace("/", "__")
|
| 40 |
paths = fs.glob(
|
| 41 |
-
f"{DETAILS_DATASET_ID}/**/{DETAILS_FILENAME}".format(
|
| 42 |
model_name_sanitized=model_name_sanitized, subtask=subtask
|
| 43 |
)
|
| 44 |
)
|
|
|
|
| 4 |
import pandas as pd
|
| 5 |
from huggingface_hub import HfFileSystem
|
| 6 |
|
| 7 |
+
import src.constants as constants
|
| 8 |
from src.hub import load_details_file
|
| 9 |
|
| 10 |
|
| 11 |
def update_task_description_component(task):
|
| 12 |
return gr.Textbox(
|
| 13 |
+
constants.TASK_DESCRIPTIONS.get(task),
|
| 14 |
label="Task Description",
|
| 15 |
lines=3,
|
| 16 |
visible=True,
|
|
|
|
| 19 |
|
| 20 |
def update_subtasks_component(task):
|
| 21 |
return gr.Radio(
|
| 22 |
+
constants.SUBTASKS.get(task),
|
| 23 |
info="Evaluation subtasks to be loaded",
|
| 24 |
value=None,
|
| 25 |
)
|
|
|
|
| 38 |
return
|
| 39 |
model_name_sanitized = model_id.replace("/", "__")
|
| 40 |
paths = fs.glob(
|
| 41 |
+
f"{constants.DETAILS_DATASET_ID}/**/{constants.DETAILS_FILENAME}".format(
|
| 42 |
model_name_sanitized=model_name_sanitized, subtask=subtask
|
| 43 |
)
|
| 44 |
)
|
src/results.py
CHANGED
|
@@ -5,13 +5,13 @@ import numpy as np
|
|
| 5 |
import pandas as pd
|
| 6 |
from huggingface_hub import HfFileSystem
|
| 7 |
|
| 8 |
-
|
| 9 |
from src.hub import load_file
|
| 10 |
|
| 11 |
|
| 12 |
def fetch_result_paths():
|
| 13 |
fs = HfFileSystem()
|
| 14 |
-
paths = fs.glob(f"{RESULTS_DATASET_ID}/**/**/*.json")
|
| 15 |
return paths
|
| 16 |
|
| 17 |
|
|
@@ -20,7 +20,7 @@ def sort_result_paths_per_model(paths):
|
|
| 20 |
|
| 21 |
d = defaultdict(list)
|
| 22 |
for path in paths:
|
| 23 |
-
model_id, _ = path[len(RESULTS_DATASET_ID) + 1:].rsplit("/", 1)
|
| 24 |
d[model_id].append(path)
|
| 25 |
return {model_id: sorted(paths) for model_id, paths in d.items()}
|
| 26 |
|
|
@@ -82,7 +82,7 @@ def display_tab(tab, df, task):
|
|
| 82 |
def update_tasks_component():
|
| 83 |
return (
|
| 84 |
gr.Radio(
|
| 85 |
-
["All"] + list(TASKS.values()),
|
| 86 |
label="Tasks",
|
| 87 |
info="Evaluation tasks to be displayed",
|
| 88 |
value="All",
|
|
@@ -98,7 +98,7 @@ def clear_results():
|
|
| 98 |
*(gr.Button("Load", interactive=False), ) * 2,
|
| 99 |
*(
|
| 100 |
gr.Radio(
|
| 101 |
-
["All"] + list(TASKS.values()),
|
| 102 |
label="Tasks",
|
| 103 |
info="Evaluation tasks to be displayed",
|
| 104 |
value="All",
|
|
|
|
| 5 |
import pandas as pd
|
| 6 |
from huggingface_hub import HfFileSystem
|
| 7 |
|
| 8 |
+
import src.constants as constants
|
| 9 |
from src.hub import load_file
|
| 10 |
|
| 11 |
|
| 12 |
def fetch_result_paths():
|
| 13 |
fs = HfFileSystem()
|
| 14 |
+
paths = fs.glob(f"{constants.RESULTS_DATASET_ID}/**/**/*.json")
|
| 15 |
return paths
|
| 16 |
|
| 17 |
|
|
|
|
| 20 |
|
| 21 |
d = defaultdict(list)
|
| 22 |
for path in paths:
|
| 23 |
+
model_id, _ = path[len(constants.RESULTS_DATASET_ID) + 1:].rsplit("/", 1)
|
| 24 |
d[model_id].append(path)
|
| 25 |
return {model_id: sorted(paths) for model_id, paths in d.items()}
|
| 26 |
|
|
|
|
| 82 |
def update_tasks_component():
|
| 83 |
return (
|
| 84 |
gr.Radio(
|
| 85 |
+
["All"] + list(constants.TASKS.values()),
|
| 86 |
label="Tasks",
|
| 87 |
info="Evaluation tasks to be displayed",
|
| 88 |
value="All",
|
|
|
|
| 98 |
*(gr.Button("Load", interactive=False), ) * 2,
|
| 99 |
*(
|
| 100 |
gr.Radio(
|
| 101 |
+
["All"] + list(constants.TASKS.values()),
|
| 102 |
label="Tasks",
|
| 103 |
info="Evaluation tasks to be displayed",
|
| 104 |
value="All",
|