Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
Commit
·
64f1a6e
1
Parent(s):
ed1fdef
Add a model size filter ✨
Browse files
app.py
CHANGED
|
@@ -294,7 +294,30 @@ def filter_items(df, leaderboard_table, query):
|
|
| 294 |
if AutoEvalColumn.model_type_symbol.name in leaderboard_table.columns:
|
| 295 |
filtered_df = df[(df[AutoEvalColumn.model_type_symbol.name] == query)]
|
| 296 |
else:
|
| 297 |
-
return leaderboard_table.columns
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 298 |
return filtered_df[leaderboard_table.columns]
|
| 299 |
|
| 300 |
def change_tab(query_param):
|
|
@@ -310,6 +333,10 @@ def change_tab(query_param):
|
|
| 310 |
else:
|
| 311 |
return gr.Tabs.update(selected=0)
|
| 312 |
|
|
|
|
|
|
|
|
|
|
|
|
|
| 313 |
|
| 314 |
demo = gr.Blocks(css=custom_css)
|
| 315 |
with demo:
|
|
@@ -332,18 +359,44 @@ with demo:
|
|
| 332 |
show_label=False,
|
| 333 |
elem_id="search-bar",
|
| 334 |
)
|
| 335 |
-
|
| 336 |
-
|
| 337 |
-
|
| 338 |
-
|
| 339 |
-
|
| 340 |
-
|
| 341 |
-
|
| 342 |
-
|
| 343 |
-
|
| 344 |
-
|
| 345 |
-
|
| 346 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 347 |
leaderboard_table = gr.components.Dataframe(
|
| 348 |
value=leaderboard_df[[AutoEvalColumn.model_type_symbol.name, AutoEvalColumn.model.name] + shown_columns.value + [AutoEvalColumn.dummy.name]],
|
| 349 |
headers=[AutoEvalColumn.model_type_symbol.name, AutoEvalColumn.model.name] + shown_columns.value + [AutoEvalColumn.dummy.name],
|
|
@@ -367,8 +420,11 @@ with demo:
|
|
| 367 |
[hidden_leaderboard_table_for_search, leaderboard_table, search_bar],
|
| 368 |
leaderboard_table,
|
| 369 |
)
|
| 370 |
-
|
| 371 |
-
|
|
|
|
|
|
|
|
|
|
| 372 |
with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=2):
|
| 373 |
gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
|
| 374 |
|
|
@@ -495,4 +551,4 @@ with demo:
|
|
| 495 |
scheduler = BackgroundScheduler()
|
| 496 |
scheduler.add_job(restart_space, "interval", seconds=3600)
|
| 497 |
scheduler.start()
|
| 498 |
-
demo.queue(concurrency_count=40).launch()
|
|
|
|
| 294 |
if AutoEvalColumn.model_type_symbol.name in leaderboard_table.columns:
|
| 295 |
filtered_df = df[(df[AutoEvalColumn.model_type_symbol.name] == query)]
|
| 296 |
else:
|
| 297 |
+
return filtered_df[leaderboard_table.columns]
|
| 298 |
+
return filtered_df[leaderboard_table.columns]
|
| 299 |
+
|
| 300 |
+
def filter_items_size(df, leaderboard_table, query):
    """Filter the leaderboard rows by a model-size bucket.

    Args:
        df: Full leaderboard data (used as a pandas DataFrame: indexed by a
            column list and by a boolean mask).
        leaderboard_table: The table currently displayed; only its
            ``columns`` attribute is read, to decide which columns of ``df``
            are returned.
        query: Bucket label; ``"all"`` or one of the other keys of
            ``numeric_intervals`` below.

    Returns:
        ``df`` restricted to the displayed columns. When ``query`` names a
        bucket and the parameter-count column is displayed, rows are also
        restricted to those whose parameter count lies in the bucket.

    Raises:
        KeyError: If ``query`` is not a key of ``numeric_intervals``.
    """
    # Bounds are (low, high), both inclusive (default of ``Series.between``).
    # Presumably expressed in billions of parameters -- TODO confirm.
    # NOTE(review): with inclusive bounds, 1 and 55 each match two buckets,
    # while values such as 5.5, 11.5 or 15.5 match none. Boundaries are left
    # as-is because changing them is a product decision.
    numeric_intervals = {
        "all": None,
        "< 1B": (0, 1),
        "~3B": (1, 5),
        "~7B": (6, 11),
        "~13B": (12, 15),
        "~35B": (16, 55),
        "60B+": (55, 1000),
    }
    visible_columns = leaderboard_table.columns

    if query == "all":
        return df[visible_columns]

    # Looked up before the column check so an unknown label still raises.
    numeric_interval = numeric_intervals[query]

    if AutoEvalColumn.params.name not in visible_columns:
        # No size column is displayed, so there is nothing to filter on.
        # Return the unfiltered view rather than referencing a variable that
        # was never assigned (previously an UnboundLocalError).
        return df[visible_columns]

    # Non-numeric sizes become NaN, which ``between`` treats as not matching,
    # so such rows are dropped from every bucket.
    params_column = pd.to_numeric(df[AutoEvalColumn.params.name], errors="coerce")
    filtered_df = df[params_column.between(*numeric_interval)]
    return filtered_df[visible_columns]
|
| 322 |
|
| 323 |
def change_tab(query_param):
|
|
|
|
| 333 |
else:
|
| 334 |
return gr.Tabs.update(selected=0)
|
| 335 |
|
| 336 |
+
def update_filter_type(input_type, shown_columns):
    """Switch the visible filter widget and make sure the size column is shown.

    Args:
        input_type: Selected filter kind; compared against ``'types'`` and
            ``'sizes'``.
        shown_columns: Currently selected column names (a list of strings,
            or ``None``/empty when nothing is selected).

    Returns:
        A 3-tuple ``(types_update, sizes_update, columns)``: a ``gr.update``
        that is visible only when ``input_type == 'types'``, a ``gr.update``
        that is visible only when ``input_type == 'sizes'``, and the column
        list including the parameter-count column.
    """
    params_name = AutoEvalColumn.params.name

    # Work on a copy: the incoming list is the component's own value and this
    # handler runs on every filter-type change, so appending in place piled up
    # one duplicate entry per change.
    columns = list(shown_columns or [])
    if params_name not in columns:
        columns.append(params_name)

    return (
        gr.update(visible=(input_type == "types")),
        gr.update(visible=(input_type == "sizes")),
        columns,
    )
|
| 339 |
+
|
| 340 |
|
| 341 |
demo = gr.Blocks(css=custom_css)
|
| 342 |
with demo:
|
|
|
|
| 359 |
show_label=False,
|
| 360 |
elem_id="search-bar",
|
| 361 |
)
|
| 362 |
+
with gr.Box(elem_id="box-filter"):
|
| 363 |
+
filter_type = gr.Dropdown(
|
| 364 |
+
label="⏚ Filter model",
|
| 365 |
+
choices=["types", "sizes"], value="types",
|
| 366 |
+
interactive=True,
|
| 367 |
+
elem_id="filter_type"
|
| 368 |
+
)
|
| 369 |
+
filter_columns = gr.Radio(
|
| 370 |
+
label="⏚ Filter model types",
|
| 371 |
+
show_label=False,
|
| 372 |
+
choices = [
|
| 373 |
+
"all",
|
| 374 |
+
ModelType.PT.to_str(),
|
| 375 |
+
ModelType.FT.to_str(),
|
| 376 |
+
ModelType.IFT.to_str(),
|
| 377 |
+
ModelType.RL.to_str(),
|
| 378 |
+
],
|
| 379 |
+
value="all",
|
| 380 |
+
elem_id="filter-columns"
|
| 381 |
+
)
|
| 382 |
+
filter_columns_size = gr.Radio(
|
| 383 |
+
label="⏚ Filter model sizes",
|
| 384 |
+
show_label=False,
|
| 385 |
+
choices = [
|
| 386 |
+
"all",
|
| 387 |
+
"< 1B",
|
| 388 |
+
"~3B",
|
| 389 |
+
"~7B",
|
| 390 |
+
"~13B",
|
| 391 |
+
"~35B",
|
| 392 |
+
"60B+"
|
| 393 |
+
],
|
| 394 |
+
value="all",
|
| 395 |
+
visible=False,
|
| 396 |
+
interactive=True,
|
| 397 |
+
elem_id="filter-columns-size"
|
| 398 |
+
)
|
| 399 |
+
|
| 400 |
leaderboard_table = gr.components.Dataframe(
|
| 401 |
value=leaderboard_df[[AutoEvalColumn.model_type_symbol.name, AutoEvalColumn.model.name] + shown_columns.value + [AutoEvalColumn.dummy.name]],
|
| 402 |
headers=[AutoEvalColumn.model_type_symbol.name, AutoEvalColumn.model.name] + shown_columns.value + [AutoEvalColumn.dummy.name],
|
|
|
|
| 420 |
[hidden_leaderboard_table_for_search, leaderboard_table, search_bar],
|
| 421 |
leaderboard_table,
|
| 422 |
)
|
| 423 |
+
|
| 424 |
+
filter_type.change(update_filter_type,inputs=[filter_type, shown_columns],outputs=[filter_columns, filter_columns_size, shown_columns],queue=False).then(select_columns, [hidden_leaderboard_table_for_search, shown_columns], leaderboard_table, queue=False)
|
| 425 |
+
shown_columns.change(select_columns, [hidden_leaderboard_table_for_search, shown_columns], leaderboard_table, queue=False)
|
| 426 |
+
filter_columns.change(filter_items, [hidden_leaderboard_table_for_search, leaderboard_table, filter_columns], leaderboard_table, queue=False)
|
| 427 |
+
filter_columns_size.change(filter_items_size, [hidden_leaderboard_table_for_search, leaderboard_table, filter_columns_size], leaderboard_table, queue=False)
|
| 428 |
with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=2):
|
| 429 |
gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")
|
| 430 |
|
|
|
|
| 551 |
scheduler = BackgroundScheduler()
|
| 552 |
scheduler.add_job(restart_space, "interval", seconds=3600)
|
| 553 |
scheduler.start()
|
| 554 |
+
demo.queue(concurrency_count=40).launch()
|