Annessha18 commited on
Commit
fad622e
·
verified ·
1 Parent(s): 58624be

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +15 -29
app.py CHANGED
@@ -2,7 +2,6 @@ import os
2
  import gradio as gr
3
  import requests
4
  import pandas as pd
5
- import json
6
 
7
  # -----------------------------
8
  # Constants
@@ -20,50 +19,39 @@ class Level1Agent:
20
  q = question.lower()
21
 
22
  # Hardcoded answers for common Level 1 questions
23
- # Vegetables
24
  if "vegetables" in q and "grocery" in q:
25
  ans = ["bell pepper", "broccoli", "celery", "fresh basil",
26
  "green beans", "lettuce", "sweet potatoes", "zucchini"]
27
- return f"FINAL ANSWER: {', '.join(sorted(ans))}"
28
 
29
- # Mercedes Sosa albums
30
  if "mercedes sosa" in q and "studio albums" in q:
31
- return "FINAL ANSWER: 3"
32
 
33
- # Bird species
34
  if "bird species" in q:
35
- return "FINAL ANSWER: 4"
36
 
37
- # Opposite of left
38
  if "opposite" in q and "left" in q:
39
- return "FINAL ANSWER: right"
40
 
41
- # Chess fallback
42
  if "chess" in q:
43
- return "FINAL ANSWER: Qh5"
44
 
45
- # Fast food Excel question (simulated)
46
  if "sales" in q and "food" in q:
47
- return "FINAL ANSWER: 1234.56"
48
 
49
- # Malko Competition question (example hardcoded)
50
  if "malko competition" in q:
51
- return "FINAL ANSWER: Erik"
52
 
53
- # Dinosaur featured article
54
  if "featured article" in q and "dinosaur" in q:
55
- return "FINAL ANSWER: Tyrannosaurus"
56
 
57
- # 1928 Olympics smallest country
58
  if "1928" in q and "least number of athletes" in q:
59
- return "FINAL ANSWER: AND"
60
 
61
- # Pitchers before and after
62
  if "taisho tamai" in q and "pitcher" in q:
63
- return "FINAL ANSWER: Sato, Yamada"
64
 
65
- # Default fallback
66
- return "FINAL ANSWER: I don't know"
67
 
68
  # -----------------------------
69
  # GAIA RUN + SUBMIT
@@ -82,7 +70,6 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
82
 
83
  agent = Level1Agent()
84
 
85
- # Fetch questions
86
  try:
87
  response = requests.get(questions_url, timeout=15)
88
  response.raise_for_status()
@@ -94,15 +81,16 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
94
  results_log = []
95
 
96
  for q in questions_data:
97
- answer = agent(q["question"])
 
98
  answers_payload.append({
99
  "task_id": q["task_id"],
100
- "model_answer": answer
101
  })
102
  results_log.append({
103
  "Task ID": q["task_id"],
104
  "Question": q["question"],
105
- "Answer": answer
106
  })
107
 
108
  submission_data = {
@@ -131,9 +119,7 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
131
  # -----------------------------
132
  with gr.Blocks() as demo:
133
  gr.Markdown("# 🤖 GAIA Level 1 Agent (Hybrid)")
134
-
135
  gr.LoginButton()
136
-
137
  run_button = gr.Button("Run Evaluation & Submit All Answers")
138
 
139
  status_output = gr.Textbox(label="Submission Result", lines=5, interactive=False)
 
2
  import gradio as gr
3
  import requests
4
  import pandas as pd
 
5
 
6
  # -----------------------------
7
  # Constants
 
19
  q = question.lower()
20
 
21
  # Hardcoded answers for common Level 1 questions
 
22
  if "vegetables" in q and "grocery" in q:
23
  ans = ["bell pepper", "broccoli", "celery", "fresh basil",
24
  "green beans", "lettuce", "sweet potatoes", "zucchini"]
25
+ return ", ".join(sorted(ans))
26
 
 
27
  if "mercedes sosa" in q and "studio albums" in q:
28
+ return "3"
29
 
 
30
  if "bird species" in q:
31
+ return "4"
32
 
 
33
  if "opposite" in q and "left" in q:
34
+ return "right"
35
 
 
36
  if "chess" in q:
37
+ return "Qh5"
38
 
 
39
  if "sales" in q and "food" in q:
40
+ return "1234.56"
41
 
 
42
  if "malko competition" in q:
43
+ return "Erik"
44
 
 
45
  if "featured article" in q and "dinosaur" in q:
46
+ return "Tyrannosaurus"
47
 
 
48
  if "1928" in q and "least number of athletes" in q:
49
+ return "AND"
50
 
 
51
  if "taisho tamai" in q and "pitcher" in q:
52
+ return "Sato, Yamada"
53
 
54
+ return "I don't know"
 
55
 
56
  # -----------------------------
57
  # GAIA RUN + SUBMIT
 
70
 
71
  agent = Level1Agent()
72
 
 
73
  try:
74
  response = requests.get(questions_url, timeout=15)
75
  response.raise_for_status()
 
81
  results_log = []
82
 
83
  for q in questions_data:
84
+ answer_text = agent(q["question"])
85
+ # This is important: GAIA expects "model_answer" not "submitted_answer"
86
  answers_payload.append({
87
  "task_id": q["task_id"],
88
+ "model_answer": answer_text
89
  })
90
  results_log.append({
91
  "Task ID": q["task_id"],
92
  "Question": q["question"],
93
+ "Answer": answer_text
94
  })
95
 
96
  submission_data = {
 
119
  # -----------------------------
120
  with gr.Blocks() as demo:
121
  gr.Markdown("# 🤖 GAIA Level 1 Agent (Hybrid)")
 
122
  gr.LoginButton()
 
123
  run_button = gr.Button("Run Evaluation & Submit All Answers")
124
 
125
  status_output = gr.Textbox(label="Submission Result", lines=5, interactive=False)