File size: 1,210 Bytes
3df5153
 
3d1b0c5
3df5153
 
3d1b0c5
 
3df5153
33cdb30
3d1b0c5
 
94b05f0
3df5153
3d1b0c5
 
 
 
3df5153
3d1b0c5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
import gradio as gr
import json
import os
import requests

from mistral_hf_wrapper import MistralInference
from agent import solve_task, load_tasks

API_URL = os.getenv("HF_MISTRAL_ENDPOINT")
API_TOKEN = os.getenv("HF_TOKEN")
USERNAME = os.getenv("HF_USERNAME")
CODE_LINK = os.getenv("HF_CODE_LINK")

def run_and_submit_all():
    model = MistralInference(api_url=API_URL, api_token=API_TOKEN)
    tasks = load_tasks()
    answers = []

    for task in tasks:
        try:
            answer = solve_task(task, model)
            answers.append({"task_id": task["task_id"], "submitted_answer": answer.strip()})
        except Exception as e:
            answers.append({"task_id": task["task_id"], "submitted_answer": f"ERROR: {str(e)}"})

    res = requests.post(
        "https://agents-course-unit4-scoring.hf.space/submit",
        headers={"Content-Type": "application/json"},
        json={"username": USERNAME, "agent_code": CODE_LINK, "answers": answers},
    )

    if res.ok:
        return json.dumps(res.json(), indent=2)
    return f"Error submitting: {res.status_code} - {res.text}"

gr.Interface(run_and_submit_all, inputs=[], outputs="textbox", title="GAIA Benchmark Agent Submission").launch()