Spaces:

MBZUAI-LLM
/

Mobile-MMLU-Challenge

Running

SondosMB committed on Dec 20, 2024

Commit

1f0c8bc

verified ·

1 Parent(s): 3b1c26f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -308,19 +308,23 @@ def evaluate_predictions(prediction_file, model_name, add_to_leaderboard):
         return f"Error during evaluation: {str(e)}", load_leaderboard()
 initialize_leaderboard_file()
 with gr.Blocks() as demo:
     gr.Markdown("""
         # Competition Title
         ### Welcome to the Competition Overview
         ![Competition Logo](Mobile-MMLU2_.pdf)
         Here you can submit your predictions, view the leaderboard, and track your performance!
     """)
     with gr.Tabs():
         with gr.TabItem("📖 Overview"):
             gr.Markdown("""
-                ## Overview
-                # Welcome to the Mobile-MMLU Benchmark Competition
 Evaluate the performance of mobile-compatible Large Language Models (LLMs) on 16,186 scenario-based and factual questions across 80 fields. Compete to showcase your model’s accuracy for real-world mobile scenarios.
@@ -380,7 +384,7 @@ For questions or support, contact us at: [Insert Email Address]
                 model_name_input = gr.Textbox(label="Model Name", placeholder="Enter your model name")
             with gr.Row():
-                overall_accuracy_display = gr.Textbox(label="Overall Accuracy", interactive=False)
                 add_to_leaderboard_checkbox = gr.Checkbox(label="Add to Leaderboard?", value=True)
             eval_button = gr.Button("Evaluate")

         return f"Error during evaluation: {str(e)}", load_leaderboard()
 initialize_leaderboard_file()
 with gr.Blocks() as demo:
     gr.Markdown("""
         # Competition Title
         ### Welcome to the Competition Overview
+        <iframe src="Mobile-MMLU2_.pdf" width="100%" height="500px"></iframe>
         ![Competition Logo](Mobile-MMLU2_.pdf)
         Here you can submit your predictions, view the leaderboard, and track your performance!
     """)
     with gr.Tabs():
         with gr.TabItem("📖 Overview"):
             gr.Markdown("""
+## Overview
+# Welcome to the Mobile-MMLU Benchmark Competition
 Evaluate the performance of mobile-compatible Large Language Models (LLMs) on 16,186 scenario-based and factual questions across 80 fields. Compete to showcase your model’s accuracy for real-world mobile scenarios.
                 model_name_input = gr.Textbox(label="Model Name", placeholder="Enter your model name")
             with gr.Row():
+                overall_accuracy_display = gr.Number(label="Overall Accuracy", interactive=False)
                 add_to_leaderboard_checkbox = gr.Checkbox(label="Add to Leaderboard?", value=True)
             eval_button = gr.Button("Evaluate")