File size: 1,964 Bytes
da9fcee
 
decddfb
 
0d4d0a1
c8f728b
 
0d4d0a1
f3dd2c8
4cd6fae
9d7ed12
0fccc5c
4cd6fae
c945f59
 
 
 
8dde8b1
 
c945f59
762c317
c945f59
 
 
71ea75d
ff4b34e
 
71ea75d
 
c945f59
 
 
 
 
 
6156cf9
c945f59
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
import pandas as pd

from openai import OpenAI

FILE_NAME = "data/gaia_validation_20.jsonl"

def get_questions():
    df = pd.read_json(FILE_NAME, lines=True)
    result=[]
    
    for index, row in df.iterrows():
        result.append([row["Level"], row["Question"], row["file_name"], row["Final answer"]])

    return result

def get_final_answer(question, initial_answer):
    prompt_template = """
        You are an expert GAIA benchmark question answering assistant, given a question and an initial answer.
        Your final answer must be a number and/or string OR as few words as possible OR a comma separated list of numbers and/or strings.
        If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise.
        If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise.
        If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
        **Question:** """ + question + """
        **Initial answer:** """ + initial_answer + """
        **Example 1:** How many 'r' are in strawberry? 3
        **Example 2:** What is the opposite of white? Black
        **Example 3:** What is the biggest city in California? Los Angeles
        **Example 4:** What is the superlative of good? Best
        **Example 5:** How many states are in the USA? 50
        **Final answer:** 
        """

    client = OpenAI()
    completion = client.chat.completions.create(
        messages=[{"role": "user", "content": [{"type": "text", "text": prompt_template}]}],
        model="gpt-4.5-preview"
    )

    final_answer = completion.choices[0].message.content
    
    print("###")
    print(question)
    print(initial_answer)
    print(final_answer)
    print("###")
    
    return final_answer