Spaces:
Paused
Paused
File size: 1,964 Bytes
da9fcee decddfb 0d4d0a1 c8f728b 0d4d0a1 f3dd2c8 4cd6fae 9d7ed12 0fccc5c 4cd6fae c945f59 8dde8b1 c945f59 762c317 c945f59 71ea75d ff4b34e 71ea75d c945f59 6156cf9 c945f59 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 | import pandas as pd
from openai import OpenAI
FILE_NAME = "data/gaia_validation_20.jsonl"
def get_questions():
df = pd.read_json(FILE_NAME, lines=True)
result=[]
for index, row in df.iterrows():
result.append([row["Level"], row["Question"], row["file_name"], row["Final answer"]])
return result
def get_final_answer(question, initial_answer):
prompt_template = """
You are an expert GAIA benchmark question answering assistant, given a question and an initial answer.
Your final answer must be a number and/or string OR as few words as possible OR a comma separated list of numbers and/or strings.
If you are asked for a number, don't use comma to write your number neither use units such as $ or percent sign unless specified otherwise.
If you are asked for a string, don't use articles, neither abbreviations (e.g. for cities), and write the digits in plain text unless specified otherwise.
If you are asked for a comma separated list, apply the above rules depending of whether the element to be put in the list is a number or a string.
**Question:** """ + question + """
**Initial answer:** """ + initial_answer + """
**Example 1:** How many 'r' are in strawberry? 3
**Example 2:** What is the opposite of white? Black
**Example 3:** What is the biggest city in California? Los Angeles
**Example 4:** What is the superlative of good? Best
**Example 5:** How many states are in the USA? 50
**Final answer:**
"""
client = OpenAI()
completion = client.chat.completions.create(
messages=[{"role": "user", "content": [{"type": "text", "text": prompt_template}]}],
model="gpt-4.5-preview"
)
final_answer = completion.choices[0].message.content
print("###")
print(question)
print(initial_answer)
print(final_answer)
print("###")
return final_answer |