FD900 committed on
Commit
55c26dd
·
verified ·
1 Parent(s): c263de5

Update gaia_benchmark/run.py

Browse files
Files changed (1) hide show
  1. gaia_benchmark/run.py +4 -4
gaia_benchmark/run.py CHANGED
@@ -1,10 +1,10 @@
1
- from gaia_benchmark.questions import get_all_questions
2
- from gaia_benchmark.gaia_interface import submit_to_leaderboard
3
 
4
  def run_and_submit_all(agent):
5
  questions = get_all_questions()
6
  answers = []
7
  for q in questions:
8
- answer = agent(q["question"])
9
  answers.append({"question_id": q["id"], "answer": answer})
10
- return submit_to_leaderboard(answers)
 
1
+ from questions import get_all_questions
2
+ from gaia_interface import submit_to_leaderboard # Adjust path if needed
3
 
4
  def run_and_submit_all(agent):
5
  questions = get_all_questions()
6
  answers = []
7
  for q in questions:
8
+ answer = agent(q) # Pass entire dict, not q["question"]
9
  answers.append({"question_id": q["id"], "answer": answer})
10
+ return submit_to_leaderboard(answers)