FD900's picture
Update app.py
924b7fa verified
raw
history blame
398 Bytes
import gradio as gr
from agent import GaiaAgent
from gaia_benchmark.run import run_and_submit_all
# One agent instance is created at import time and reused for every click;
# its bound `answer_question` method is what gets handed to the runner.
agent = GaiaAgent()

# Components and event listeners must be created inside the Blocks context
# so that they are registered on `demo`.
with gr.Blocks() as demo:
    gr.Markdown("# GAIA Agent Evaluation")
    btn = gr.Button("Run Evaluation & Submit All Answers")
    result = gr.Textbox(label="Submission Result")
    # No `inputs` are wired, so the callback takes no arguments; whatever
    # run_and_submit_all returns is written to the `result` textbox.
    btn.click(fn=lambda: run_and_submit_all(agent.answer_question), outputs=result)

# Start the app once the layout has been fully defined.
demo.launch()