abdul4rehman215 commited on
Commit
08b68d6
·
verified ·
1 Parent(s): 81917a3

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +255 -94
app.py CHANGED
@@ -1,34 +1,231 @@
1
  import os
 
 
 
 
 
 
 
2
  import gradio as gr
3
  import requests
4
- import inspect
5
  import pandas as pd
 
6
 
7
- # (Keep Constants as is)
8
  # --- Constants ---
9
  DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
10
 
11
- # --- Basic Agent Definition ---
12
- # ----- THIS IS WERE YOU CAN BUILD WHAT YOU WANT ------
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
13
  class BasicAgent:
14
  def __init__(self):
 
 
 
 
15
  print("BasicAgent initialized.")
16
- def __call__(self, question: str) -> str:
17
- print(f"Agent received question (first 50 chars): {question[:50]}...")
18
- fixed_answer = "This is a default answer."
19
- print(f"Agent returning fixed answer: {fixed_answer}")
20
- return fixed_answer
21
 
22
- def run_and_submit_all( profile: gr.OAuthProfile | None):
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
23
  """
24
  Fetches all questions, runs the BasicAgent on them, submits all answers,
25
  and displays the results.
26
  """
27
- # --- Determine HF Space Runtime URL and Repo URL ---
28
- space_id = os.getenv("SPACE_ID") # Get the SPACE_ID for sending link to the code
29
 
30
  if profile:
31
- username= f"{profile.username}"
32
  print(f"User logged in: {username}")
33
  else:
34
  print("User not logged in.")
@@ -38,70 +235,73 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
38
  questions_url = f"{api_url}/questions"
39
  submit_url = f"{api_url}/submit"
40
 
41
- # 1. Instantiate Agent ( modify this part to create your agent)
42
  try:
43
  agent = BasicAgent()
44
  except Exception as e:
45
  print(f"Error instantiating agent: {e}")
46
  return f"Error initializing agent: {e}", None
47
- # In the case of an app running as a hugging Face space, this link points toward your codebase ( usefull for others so please keep it public)
48
  agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
49
  print(agent_code)
50
 
51
- # 2. Fetch Questions
52
  print(f"Fetching questions from: {questions_url}")
53
  try:
54
- response = requests.get(questions_url, timeout=15)
55
  response.raise_for_status()
56
  questions_data = response.json()
57
  if not questions_data:
58
- print("Fetched questions list is empty.")
59
- return "Fetched questions list is empty or invalid format.", None
60
  print(f"Fetched {len(questions_data)} questions.")
61
- except requests.exceptions.RequestException as e:
62
- print(f"Error fetching questions: {e}")
63
- return f"Error fetching questions: {e}", None
64
- except requests.exceptions.JSONDecodeError as e:
65
- print(f"Error decoding JSON response from questions endpoint: {e}")
66
- print(f"Response text: {response.text[:500]}")
67
- return f"Error decoding server response for questions: {e}", None
68
  except Exception as e:
69
- print(f"An unexpected error occurred fetching questions: {e}")
70
- return f"An unexpected error occurred fetching questions: {e}", None
71
 
72
- # 3. Run your Agent
73
  results_log = []
74
  answers_payload = []
 
75
  print(f"Running agent on {len(questions_data)} questions...")
76
  for item in questions_data:
77
  task_id = item.get("task_id")
78
  question_text = item.get("question")
79
  if not task_id or question_text is None:
80
- print(f"Skipping item with missing task_id or question: {item}")
81
  continue
 
82
  try:
83
- submitted_answer = agent(question_text)
84
- answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
85
- results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
 
 
 
 
 
 
 
 
86
  except Exception as e:
87
- print(f"Error running agent on task {task_id}: {e}")
88
- results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"AGENT ERROR: {e}"})
 
 
 
 
 
89
 
90
  if not answers_payload:
91
- print("Agent did not produce any answers to submit.")
92
  return "Agent did not produce any answers to submit.", pd.DataFrame(results_log)
93
 
94
- # 4. Prepare Submission
95
- submission_data = {"username": username.strip(), "agent_code": agent_code, "answers": answers_payload}
96
- status_update = f"Agent finished. Submitting {len(answers_payload)} answers for user '{username}'..."
97
- print(status_update)
 
98
 
99
- # 5. Submit
100
  print(f"Submitting {len(answers_payload)} answers to: {submit_url}")
101
  try:
102
- response = requests.post(submit_url, json=submission_data, timeout=60)
103
  response.raise_for_status()
104
  result_data = response.json()
 
105
  final_status = (
106
  f"Submission Successful!\n"
107
  f"User: {result_data.get('username')}\n"
@@ -109,61 +309,43 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
109
  f"({result_data.get('correct_count', '?')}/{result_data.get('total_attempted', '?')} correct)\n"
110
  f"Message: {result_data.get('message', 'No message received.')}"
111
  )
112
- print("Submission successful.")
113
  results_df = pd.DataFrame(results_log)
114
  return final_status, results_df
 
115
  except requests.exceptions.HTTPError as e:
116
  error_detail = f"Server responded with status {e.response.status_code}."
117
  try:
118
  error_json = e.response.json()
119
  error_detail += f" Detail: {error_json.get('detail', e.response.text)}"
120
- except requests.exceptions.JSONDecodeError:
121
  error_detail += f" Response: {e.response.text[:500]}"
122
- status_message = f"Submission Failed: {error_detail}"
123
- print(status_message)
124
- results_df = pd.DataFrame(results_log)
125
- return status_message, results_df
126
  except requests.exceptions.Timeout:
127
- status_message = "Submission Failed: The request timed out."
128
- print(status_message)
129
- results_df = pd.DataFrame(results_log)
130
- return status_message, results_df
131
  except requests.exceptions.RequestException as e:
132
- status_message = f"Submission Failed: Network error - {e}"
133
- print(status_message)
134
- results_df = pd.DataFrame(results_log)
135
- return status_message, results_df
136
  except Exception as e:
137
- status_message = f"An unexpected error occurred during submission: {e}"
138
- print(status_message)
139
- results_df = pd.DataFrame(results_log)
140
- return status_message, results_df
141
 
142
 
143
- # --- Build Gradio Interface using Blocks ---
144
  with gr.Blocks() as demo:
145
  gr.Markdown("# Basic Agent Evaluation Runner")
146
  gr.Markdown(
147
  """
148
  **Instructions:**
149
-
150
- 1. Please clone this space, then modify the code to define your agent's logic, the tools, the necessary packages, etc ...
151
- 2. Log in to your Hugging Face account using the button below. This uses your HF username for submission.
152
- 3. Click 'Run Evaluation & Submit All Answers' to fetch questions, run your agent, submit answers, and see the score.
153
-
154
- ---
155
- **Disclaimers:**
156
- Once clicking on the "submit button, it can take quite some time ( this is the time for the agent to go through all the questions).
157
- This space provides a basic setup and is intentionally sub-optimal to encourage you to develop your own, more robust solution. For instance for the delay process of the submit button, a solution could be to cache the answers and submit in a seperate action or even to answer the questions in async.
158
  """
159
  )
160
 
161
  gr.LoginButton()
162
-
163
  run_button = gr.Button("Run Evaluation & Submit All Answers")
164
-
165
  status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
166
- # Removed max_rows=10 from DataFrame constructor
167
  results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
168
 
169
  run_button.click(
@@ -172,25 +354,4 @@ with gr.Blocks() as demo:
172
  )
173
 
174
  if __name__ == "__main__":
175
- print("\n" + "-"*30 + " App Starting " + "-"*30)
176
- # Check for SPACE_HOST and SPACE_ID at startup for information
177
- space_host_startup = os.getenv("SPACE_HOST")
178
- space_id_startup = os.getenv("SPACE_ID") # Get SPACE_ID at startup
179
-
180
- if space_host_startup:
181
- print(f"✅ SPACE_HOST found: {space_host_startup}")
182
- print(f" Runtime URL should be: https://{space_host_startup}.hf.space")
183
- else:
184
- print("ℹ️ SPACE_HOST environment variable not found (running locally?).")
185
-
186
- if space_id_startup: # Print repo URLs if SPACE_ID is found
187
- print(f"✅ SPACE_ID found: {space_id_startup}")
188
- print(f" Repo URL: https://huggingface.co/spaces/{space_id_startup}")
189
- print(f" Repo Tree URL: https://huggingface.co/spaces/{space_id_startup}/tree/main")
190
- else:
191
- print("ℹ️ SPACE_ID environment variable not found (running locally?). Repo URL cannot be determined.")
192
-
193
- print("-"*(60 + len(" App Starting ")) + "\n")
194
-
195
- print("Launching Gradio Interface for Basic Agent Evaluation...")
196
  demo.launch(debug=True, share=False)
 
1
  import os
2
+ import re
3
+ import io
4
+ import base64
5
+ import mimetypes
6
+ import tempfile
7
+ from pathlib import Path
8
+
9
  import gradio as gr
10
  import requests
 
11
  import pandas as pd
12
+ from openai import OpenAI
13
 
 
14
  # --- Constants ---
15
  DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
16
 
17
+ # Set these in your Space Secrets:
18
+ # LLM_API_KEY -> your API key
19
+ # LLM_BASE_URL -> optional, for OpenAI-compatible providers
20
+ # MODEL_NAME -> e.g. gpt-4o-mini or another strong model
21
+ # TRANSCRIBE_MODEL -> e.g. gpt-4o-mini-transcribe
22
+ LLM_API_KEY = os.getenv("LLM_API_KEY", "")
23
+ LLM_BASE_URL = os.getenv("LLM_BASE_URL", "https://api.openai.com/v1")
24
+ MODEL_NAME = os.getenv("MODEL_NAME", "gpt-4o-mini")
25
+ TRANSCRIBE_MODEL = os.getenv("TRANSCRIBE_MODEL", "gpt-4o-mini-transcribe")
26
+
27
+
28
+ def to_data_url(file_path: str) -> str:
29
+ mime, _ = mimetypes.guess_type(file_path)
30
+ if not mime:
31
+ mime = "application/octet-stream"
32
+ with open(file_path, "rb") as f:
33
+ b64 = base64.b64encode(f.read()).decode("utf-8")
34
+ return f"data:{mime};base64,{b64}"
35
+
36
+
37
+ def clean_final_answer(text: str) -> str:
38
+ if not text:
39
+ return ""
40
+ text = text.strip()
41
+ text = re.sub(r"^\s*(final answer|answer)\s*[:\-]\s*", "", text, flags=re.I)
42
+ text = text.strip().strip('"').strip("'")
43
+ return text
44
+
45
+
46
+ def extract_urls(text: str):
47
+ return re.findall(r"https?://[^\s)\]]+", text or "")
48
+
49
+
50
  class BasicAgent:
51
  def __init__(self):
52
+ if not LLM_API_KEY:
53
+ raise ValueError("Missing LLM_API_KEY in Space Secrets.")
54
+ self.client = OpenAI(api_key=LLM_API_KEY, base_url=LLM_BASE_URL)
55
+ self.api_url = DEFAULT_API_URL
56
  print("BasicAgent initialized.")
 
 
 
 
 
57
 
58
+ def download_task_file(self, task_id: str, file_name: str) -> str | None:
59
+ if not file_name:
60
+ return None
61
+
62
+ url = f"{self.api_url}/files/{task_id}"
63
+ print(f"Downloading attached file from {url}")
64
+
65
+ r = requests.get(url, timeout=60)
66
+ if r.status_code != 200:
67
+ print(f"Could not fetch file for task {task_id}: {r.status_code}")
68
+ return None
69
+
70
+ suffix = Path(file_name).suffix or ""
71
+ fd, tmp_path = tempfile.mkstemp(suffix=suffix)
72
+ os.close(fd)
73
+ with open(tmp_path, "wb") as f:
74
+ f.write(r.content)
75
+ return tmp_path
76
+
77
+ def read_text_like_file(self, file_path: str) -> str | None:
78
+ suffix = Path(file_path).suffix.lower()
79
+ if suffix not in {".txt", ".md", ".json", ".csv", ".py", ".html"}:
80
+ return None
81
+
82
+ try:
83
+ with open(file_path, "r", encoding="utf-8", errors="ignore") as f:
84
+ data = f.read()
85
+ return data[:15000]
86
+ except Exception as e:
87
+ return f"[Could not read text file: {e}]"
88
+
89
+ def summarize_spreadsheet(self, file_path: str) -> str:
90
+ try:
91
+ xls = pd.ExcelFile(file_path)
92
+ out = []
93
+ for sheet_name in xls.sheet_names[:3]:
94
+ df = pd.read_excel(file_path, sheet_name=sheet_name)
95
+ out.append(f"Sheet: {sheet_name}")
96
+ out.append("Columns: " + ", ".join(map(str, df.columns.tolist())))
97
+ out.append("Preview:")
98
+ out.append(df.head(20).to_csv(index=False))
99
+ out.append("")
100
+ return "\n".join(out)[:15000]
101
+ except Exception as e:
102
+ return f"[Could not read spreadsheet: {e}]"
103
+
104
+ def transcribe_audio(self, file_path: str) -> str:
105
+ try:
106
+ with open(file_path, "rb") as audio_file:
107
+ transcript = self.client.audio.transcriptions.create(
108
+ model=TRANSCRIBE_MODEL,
109
+ file=audio_file,
110
+ )
111
+ text = getattr(transcript, "text", "") or ""
112
+ return text[:12000]
113
+ except Exception as e:
114
+ return f"[Could not transcribe audio: {e}]"
115
+
116
+ def fetch_web_context(self, question: str) -> str:
117
+ urls = extract_urls(question)
118
+ if not urls:
119
+ return ""
120
+
121
+ chunks = []
122
+ for url in urls[:2]:
123
+ try:
124
+ r = requests.get(url, timeout=30, headers={"User-Agent": "Mozilla/5.0"})
125
+ content = r.text[:12000]
126
+ chunks.append(f"URL: {url}\nCONTENT:\n{content}\n")
127
+ except Exception as e:
128
+ chunks.append(f"URL: {url}\n[Could not fetch: {e}]")
129
+ return "\n\n".join(chunks)
130
+
131
+ def ask_model(self, question: str, extra_context: str = "", image_paths=None) -> str:
132
+ image_paths = image_paths or []
133
+
134
+ system_prompt = (
135
+ "You solve benchmark questions carefully.\n"
136
+ "Return ONLY the final answer.\n"
137
+ "Do not add explanations.\n"
138
+ "Do not add 'FINAL ANSWER'.\n"
139
+ "Keep formatting exactly as requested in the question.\n"
140
+ "If the question asks for alphabetical order, preserve it.\n"
141
+ "If it asks for comma-separated output, return only that comma-separated output.\n"
142
+ "If it asks for a name, return only the name requested.\n"
143
+ )
144
+
145
+ user_parts = []
146
+ user_parts.append({
147
+ "type": "text",
148
+ "text": f"QUESTION:\n{question}\n\nEXTRA CONTEXT:\n{extra_context[:20000]}"
149
+ })
150
+
151
+ for img in image_paths[:3]:
152
+ user_parts.append({
153
+ "type": "image_url",
154
+ "image_url": {"url": to_data_url(img)}
155
+ })
156
+
157
+ response = self.client.chat.completions.create(
158
+ model=MODEL_NAME,
159
+ temperature=0,
160
+ messages=[
161
+ {"role": "system", "content": system_prompt},
162
+ {"role": "user", "content": user_parts},
163
+ ],
164
+ )
165
+
166
+ answer = response.choices[0].message.content or ""
167
+ return clean_final_answer(answer)
168
+
169
+ def __call__(self, task: dict) -> str:
170
+ task_id = task.get("task_id", "")
171
+ question = task.get("question", "")
172
+ file_name = task.get("file_name", "") or ""
173
+
174
+ print(f"Task {task_id} | file_name={file_name}")
175
+
176
+ extra_context = []
177
+ image_paths = []
178
+
179
+ # 1) Fetch webpage content if URLs appear in the question
180
+ web_context = self.fetch_web_context(question)
181
+ if web_context:
182
+ extra_context.append("WEB CONTEXT:\n" + web_context)
183
+
184
+ # 2) Download attached file if any
185
+ local_file = None
186
+ if file_name:
187
+ local_file = self.download_task_file(task_id, file_name)
188
+
189
+ # 3) Handle attachment types
190
+ if local_file:
191
+ suffix = Path(local_file).suffix.lower()
192
+
193
+ if suffix in {".png", ".jpg", ".jpeg", ".webp"}:
194
+ image_paths.append(local_file)
195
+
196
+ elif suffix in {".mp3", ".wav", ".m4a", ".mpeg"}:
197
+ transcript = self.transcribe_audio(local_file)
198
+ extra_context.append("AUDIO TRANSCRIPT:\n" + transcript)
199
+
200
+ elif suffix in {".xlsx", ".xls"}:
201
+ sheet_summary = self.summarize_spreadsheet(local_file)
202
+ extra_context.append("SPREADSHEET CONTENT:\n" + sheet_summary)
203
+
204
+ else:
205
+ text_data = self.read_text_like_file(local_file)
206
+ if text_data:
207
+ extra_context.append(f"ATTACHED FILE CONTENT ({file_name}):\n{text_data}")
208
+
209
+ # 4) Ask model
210
+ final_answer = self.ask_model(
211
+ question=question,
212
+ extra_context="\n\n".join(extra_context),
213
+ image_paths=image_paths,
214
+ )
215
+
216
+ print(f"Final answer for task {task_id}: {final_answer}")
217
+ return final_answer
218
+
219
+
220
+ def run_and_submit_all(profile: gr.OAuthProfile | None):
221
  """
222
  Fetches all questions, runs the BasicAgent on them, submits all answers,
223
  and displays the results.
224
  """
225
+ space_id = os.getenv("SPACE_ID")
 
226
 
227
  if profile:
228
+ username = f"{profile.username}"
229
  print(f"User logged in: {username}")
230
  else:
231
  print("User not logged in.")
 
235
  questions_url = f"{api_url}/questions"
236
  submit_url = f"{api_url}/submit"
237
 
 
238
  try:
239
  agent = BasicAgent()
240
  except Exception as e:
241
  print(f"Error instantiating agent: {e}")
242
  return f"Error initializing agent: {e}", None
243
+
244
  agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
245
  print(agent_code)
246
 
 
247
  print(f"Fetching questions from: {questions_url}")
248
  try:
249
+ response = requests.get(questions_url, timeout=30)
250
  response.raise_for_status()
251
  questions_data = response.json()
252
  if not questions_data:
253
+ return "Fetched questions list is empty or invalid format.", None
 
254
  print(f"Fetched {len(questions_data)} questions.")
 
 
 
 
 
 
 
255
  except Exception as e:
256
+ return f"Error fetching questions: {e}", None
 
257
 
 
258
  results_log = []
259
  answers_payload = []
260
+
261
  print(f"Running agent on {len(questions_data)} questions...")
262
  for item in questions_data:
263
  task_id = item.get("task_id")
264
  question_text = item.get("question")
265
  if not task_id or question_text is None:
266
+ print(f"Skipping invalid item: {item}")
267
  continue
268
+
269
  try:
270
+ submitted_answer = agent(item)
271
+ answers_payload.append({
272
+ "task_id": task_id,
273
+ "submitted_answer": submitted_answer
274
+ })
275
+ results_log.append({
276
+ "Task ID": task_id,
277
+ "Question": question_text,
278
+ "File": item.get("file_name", ""),
279
+ "Submitted Answer": submitted_answer
280
+ })
281
  except Exception as e:
282
+ print(f"Error running agent on task {task_id}: {e}")
283
+ results_log.append({
284
+ "Task ID": task_id,
285
+ "Question": question_text,
286
+ "File": item.get("file_name", ""),
287
+ "Submitted Answer": f"AGENT ERROR: {e}"
288
+ })
289
 
290
  if not answers_payload:
 
291
  return "Agent did not produce any answers to submit.", pd.DataFrame(results_log)
292
 
293
+ submission_data = {
294
+ "username": username.strip(),
295
+ "agent_code": agent_code,
296
+ "answers": answers_payload
297
+ }
298
 
 
299
  print(f"Submitting {len(answers_payload)} answers to: {submit_url}")
300
  try:
301
+ response = requests.post(submit_url, json=submission_data, timeout=120)
302
  response.raise_for_status()
303
  result_data = response.json()
304
+
305
  final_status = (
306
  f"Submission Successful!\n"
307
  f"User: {result_data.get('username')}\n"
 
309
  f"({result_data.get('correct_count', '?')}/{result_data.get('total_attempted', '?')} correct)\n"
310
  f"Message: {result_data.get('message', 'No message received.')}"
311
  )
312
+
313
  results_df = pd.DataFrame(results_log)
314
  return final_status, results_df
315
+
316
  except requests.exceptions.HTTPError as e:
317
  error_detail = f"Server responded with status {e.response.status_code}."
318
  try:
319
  error_json = e.response.json()
320
  error_detail += f" Detail: {error_json.get('detail', e.response.text)}"
321
+ except Exception:
322
  error_detail += f" Response: {e.response.text[:500]}"
323
+ return f"Submission Failed: {error_detail}", pd.DataFrame(results_log)
324
+
 
 
325
  except requests.exceptions.Timeout:
326
+ return "Submission Failed: The request timed out.", pd.DataFrame(results_log)
327
+
 
 
328
  except requests.exceptions.RequestException as e:
329
+ return f"Submission Failed: Network error - {e}", pd.DataFrame(results_log)
330
+
 
 
331
  except Exception as e:
332
+ return f"An unexpected error occurred during submission: {e}", pd.DataFrame(results_log)
 
 
 
333
 
334
 
 
335
  with gr.Blocks() as demo:
336
  gr.Markdown("# Basic Agent Evaluation Runner")
337
  gr.Markdown(
338
  """
339
  **Instructions:**
340
+ 1. Edit this Space to define your agent's logic and tools.
341
+ 2. Log in to your Hugging Face account using the button below.
342
+ 3. Click 'Run Evaluation & Submit All Answers' to fetch questions, run your agent, submit answers, and see the score.
 
 
 
 
 
 
343
  """
344
  )
345
 
346
  gr.LoginButton()
 
347
  run_button = gr.Button("Run Evaluation & Submit All Answers")
 
348
  status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
 
349
  results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
350
 
351
  run_button.click(
 
354
  )
355
 
356
  if __name__ == "__main__":
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
357
  demo.launch(debug=True, share=False)