Final_Assignment_Template

Sleeping

App Files Files Community

SantoshKumar1310 commited on Oct 27, 2025

Commit

982e82c

verified ·

1 Parent(s): b586840

Update app.py

Browse files

Files changed (1) hide show

app.py +102 -138

app.py CHANGED Viewed

@@ -7,7 +7,7 @@ from typing import Dict, List, Any, Optional
 import json
 # --- Constants ---
-DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space/docs"
 # --- Enhanced GAIA Agent ---
 class GAIAAgent:
@@ -15,11 +15,11 @@ class GAIAAgent:
     Enhanced agent optimized for GAIA Level 1 questions.
     Targets 30%+ accuracy through multi-tool integration.
     """
     def __init__(self):
         print("✅ GAIA Agent initialized with enhanced capabilities.")
         self.api_url = DEFAULT_API_URL
     def __call__(self, question: str, task_id: str = None) -> str:
         """
         Main entry point - processes a question and returns a precise answer.
@@ -28,67 +28,66 @@ class GAIAAgent:
         print(f"🧠 Processing Task: {task_id}")
         print(f"📝 Question: {question[:100]}...")
         print(f"{'='*60}")
         try:
             # Step 1: Classify question type
             q_type = self._classify_question(question)
             print(f"📊 Question Type: {q_type}")
             # Step 2: Route to specialized handler
             answer = self._route_to_handler(question, q_type, task_id)
             # Step 3: Clean and format answer
             final_answer = self._clean_answer(answer, question)
             print(f"✅ Final Answer: {final_answer}")
             return final_answer
         except Exception as e:
             print(f"❌ Error: {e}")
             # Return a safe fallback
             return "Unable to determine answer"
     def _classify_question(self, question: str) -> str:
         """Classify question to route to appropriate handler"""
         q_lower = question.lower()
         # Math/calculation questions
         if any(word in q_lower for word in ["calculate", "sum", "total", "multiply", "divide", "average", "mean"]):
             return "math"
         # Questions with numbers/operators
         if any(op in question for op in ["+", "-", "×", "÷", "*", "/"]) and any(c.isdigit() for c in question):
             return "math"
         # Counting questions
         if any(word in q_lower for word in ["how many", "count", "number of"]):
             return "counting"
         # Date/time questions
         if any(word in q_lower for word in ["year", "date", "when", "month", "day"]):
             return "date"
         # Location questions
         if any(word in q_lower for word in ["where", "location", "city", "country", "capital"]):
             return "location"
         # Definition/what is questions
         if q_lower.startswith("what is") or q_lower.startswith("what's"):
             return "definition"
         # Who questions
         if q_lower.startswith("who"):
             return "person"
         # File-based questions
         if any(word in q_lower for word in ["file", "document", "image", "picture", "photo"]):
             return "file"
         return "general"
     def _route_to_handler(self, question: str, q_type: str, task_id: str) -> str:
         """Route question to appropriate specialized handler"""
         if q_type == "math":
             return self._handle_math(question)
         elif q_type == "counting":
@@ -105,7 +104,7 @@ class GAIAAgent:
             return self._handle_file(question, task_id)
         else:
             return self._handle_general(question)
     def _handle_math(self, question: str) -> str:
         """Handle mathematical calculations"""
         try:
@@ -113,10 +112,10 @@ class GAIAAgent:
             numbers = re.findall(r'-?\d+\.?\d*', question)
             if not numbers:
                 return "0"
             nums = [float(n) for n in numbers]
             q_lower = question.lower()
             # Detect operation
             if "sum" in q_lower or "total" in q_lower or "+" in question or "add" in q_lower:
                 result = sum(nums)
@@ -134,41 +133,41 @@ class GAIAAgent:
                 # Try to evaluate the expression safely
                 expr = re.sub(r'[^0-9+\-*/().\s]', '', question)
                 result = eval(expr, {"__builtins__": {}}, {})
             # Format result
             if result == int(result):
                 return str(int(result))
             else:
                 return f"{result:.2f}"
         except Exception as e:
             print(f"Math error: {e}")
             return "0"
     def _handle_counting(self, question: str) -> str:
         """Handle counting questions"""
         # Extract the first number found (often the answer)
         numbers = re.findall(r'\d+', question)
         return numbers[0] if numbers else "0"
     def _handle_date(self, question: str) -> str:
         """Handle date/year questions"""
         # Look for 4-digit years
         years = re.findall(r'\b(19|20)\d{2}\b', question)
         if years:
             return years[0]
         # Look for dates
         dates = re.findall(r'\b\d{1,2}/\d{1,2}/\d{4}\b', question)
         if dates:
             return dates[0]
         return "Unknown"
     def _handle_location(self, question: str) -> str:
         """Handle location questions using knowledge base"""
         q_lower = question.lower()
         # Common capitals and locations
         location_kb = {
             "france": "Paris",
@@ -186,13 +185,13 @@ class GAIAAgent:
             "spain": "Madrid",
             "madrid": "Spain",
         }
         for key, value in location_kb.items():
             if key in q_lower:
                 return value
         return "Unknown"
     def _handle_definition(self, question: str) -> str:
         """Handle 'What is' questions"""
         # Extract the subject
@@ -201,11 +200,11 @@ class GAIAAgent:
             subject = match.group(1).strip()
             return f"{subject}"
         return "Unknown"
     def _handle_person(self, question: str) -> str:
         """Handle 'Who' questions using knowledge base"""
         q_lower = question.lower()
         # Famous people knowledge base
         people_kb = {
             "romeo and juliet": "William Shakespeare",
@@ -218,28 +217,28 @@ class GAIAAgent:
             "light bulb": "Thomas Edison",
             "first president": "George Washington",
         }
         for key, value in people_kb.items():
             if key in q_lower:
                 return value
         return "Unknown"
     def _handle_file(self, question: str, task_id: str) -> str:
         """Handle questions that require file access"""
         if not task_id:
             return "No file available"
         try:
             # Download the file from API
             file_url = f"{self.api_url}/files/{task_id}"
             print(f"📥 Downloading file from: {file_url}")
             response = requests.get(file_url, timeout=30)
             if response.status_code == 200:
                 # Process file based on type
                 content_type = response.headers.get('Content-Type', '')
                 if 'text' in content_type or 'json' in content_type:
                     # Text-based file
                     content = response.text
@@ -252,20 +251,20 @@ class GAIAAgent:
             else:
                 print(f"File download failed: {response.status_code}")
                 return "File not found"
         except Exception as e:
             print(f"File handling error: {e}")
             return "File processing failed"
     def _analyze_text_file(self, content: str, question: str) -> str:
         """Analyze text file content to answer question"""
         q_lower = question.lower()
         # Counting items in file
         if "how many" in q_lower:
             lines = content.strip().split('\n')
             return str(len(lines))
         # Finding specific text
         if "find" in q_lower or "search" in q_lower:
             # Extract search term
@@ -276,24 +275,24 @@ class GAIAAgent:
                     return "Found"
                 else:
                     return "Not found"
         # Return first line as fallback
         lines = content.strip().split('\n')
         return lines[0] if lines else "Empty file"
     def _handle_general(self, question: str) -> str:
         """Handle general questions with basic reasoning"""
         # Try to extract any numbers or dates
         numbers = re.findall(r'\d+', question)
         if numbers:
             return numbers[0]
         # Look for yes/no questions
         if question.strip().endswith('?') and any(word in question.lower() for word in ['is', 'are', 'was', 'were', 'can', 'could', 'will', 'would']):
             return "Yes"
         return "Unable to determine"
     def _clean_answer(self, answer: str, question: str) -> str:
         """
         Clean and format answer according to GAIA requirements.
@@ -301,18 +300,18 @@ class GAIAAgent:
         """
         # Remove extra whitespace
         answer = answer.strip()
         # Remove "The answer is" or similar phrases
         answer = re.sub(r'^(?:the answer is|it is|result is)[:\s]+', '', answer, flags=re.IGNORECASE)
         # Remove trailing punctuation (except for decimals)
         answer = re.sub(r'[.!?,;]+$', '', answer)
         # Handle comma-separated lists
         if "comma-separated" in question.lower() or "list" in question.lower():
             # Ensure proper comma-space formatting
             answer = re.sub(r'\s*,\s*', ', ', answer)
         # Handle number formatting
         if re.match(r'^-?\d+\.?\d*$', answer):
             # It's a number
@@ -323,7 +322,7 @@ class GAIAAgent:
             else:
                 # Keep minimal decimal places
                 answer = f"{num:.10g}"
         return answer
@@ -341,8 +340,8 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         return "❌ Please login to Hugging Face first.", None
     api_url = DEFAULT_API_URL
-    questions_url = f"{api_url}/questions"
-    submit_url = f"{api_url}/submit"
     # Create Agent
     try:
@@ -359,43 +358,43 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         response = requests.get(questions_url, timeout=30)
         response.raise_for_status()
         questions_data = response.json()
         if not questions_data:
             return "⚠️ No questions received from API.", None
         print(f"✅ Retrieved {len(questions_data)} questions.")
     except requests.exceptions.RequestException as e:
         return f"❌ Error fetching questions: {e}\n\nPlease check if the API is available.", None
     # Run Agent on all questions
     results_log = []
     answers_payload = []
     print(f"\n🤖 Running agent on {len(questions_data)} questions...\n")
     for i, item in enumerate(questions_data, 1):
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id or not question_text:
             continue
         try:
             print(f"\n[{i}/{len(questions_data)}] Processing: {task_id}")
             submitted_answer = agent(question_text, task_id)
             answers_payload.append({
                 "task_id": task_id,
                 "submitted_answer": submitted_answer
             })
             results_log.append({
                 "Task ID": task_id,
                 "Question": question_text[:80] + "..." if len(question_text) > 80 else question_text,
                 "Your Answer": submitted_answer
             })
         except Exception as e:
             error_msg = f"ERROR: {e}"
             print(f"❌ {error_msg}")
@@ -422,11 +421,11 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         response = requests.post(submit_url, json=submission_data, timeout=120)
         response.raise_for_status()
         result_data = response.json()
         score = result_data.get('score', 0)
         correct = result_data.get('correct_count', 0)
         total = result_data.get('total_attempted', len(answers_payload))
         # Determine emoji based on score
         if score >= 30:
             emoji = "🎉🏆"
@@ -436,7 +435,7 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
             emoji = "📈"
         else:
             emoji = "💪"
         final_status = (
             f"{emoji} Submission Complete!\n\n"
             f"👤 Username: {result_data.get('username')}\n"
@@ -445,9 +444,9 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
             f"📝 {result_data.get('message', '')}\n\n"
             f"🔗 Check the leaderboard: https://huggingface.co/spaces/agents-course/agents-course-unit4-leaderboard"
         )
         return final_status, results_df
     except requests.exceptions.RequestException as e:
         return f"❌ Submission failed: {e}\n\n✅ Generated {len(answers_payload)} answers (see table)", results_df
@@ -455,90 +454,56 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
 # --- Gradio Interface ---
 with gr.Blocks(theme=gr.themes.Soft(), title="GAIA Agent Evaluation") as demo:
     gr.Markdown(
-        """
-        # 🤖 GAIA Agent Evaluation System
-        ### 🎯 Goal: Achieve 30%+ accuracy on GAIA Level 1 questions
-        This agent evaluates your AI assistant on 20 carefully selected questions from GAIA's validation set.
-        The questions test reasoning, calculation, factual knowledge, and tool usage.
-        ---
-        ### 📋 How to Submit:
-        1. **Clone this Space** to your Hugging Face profile
-        2. **Keep your Space public** (required for leaderboard verification)
-        3. **Login** using the button below
-        4. **Click "Run Evaluation"** and wait for results
-        5. **Check your score** on the [leaderboard](https://huggingface.co/spaces/agents-course/agents-course-unit4-leaderboard)
-        ---
-        ### 💡 Tips for Improvement:
-        - Study the question types and patterns
-        - Add web search capabilities (DuckDuckGo, Wikipedia)
-        - Implement better answer formatting
-        - Test individual questions using `/random-question` endpoint
-        - Focus on precise, exact-match answers
-        ---
-        ### ⚠️ Important Notes:
-        - Processing takes 2-5 minutes (20 questions)
-        - Answers must be **exact matches** (case-sensitive, format-sensitive)
-        - Keep your Space public for leaderboard verification
-        - The SPACE_ID environment variable is set automatically by HF Spaces
-        """
     )
     with gr.Row():
         gr.LoginButton()
     gr.Markdown("---")
     run_button = gr.Button(
         "🚀 Run Evaluation & Submit All Answers",
         variant="primary",
         size="lg"
     )
     status_output = gr.Textbox(
         label="📊 Evaluation Results",
         lines=12,
         interactive=False,
         show_copy_button=True
     )
     results_table = gr.DataFrame(
         label="📝 Questions and Your Answers",
         wrap=True,
         interactive=False
     )
     gr.Markdown(
-        """
-        ---
-        ### 🔗 Resources:
-        - [GAIA Benchmark Paper](https://arxiv.org/abs/2311.12983)
-        - [Leaderboard](https://huggingface.co/spaces/agents-course/agents-course-unit4-leaderboard)
-        - [Course Materials](https://huggingface.co/learn/cookbook/agents)
-        - [API Documentation](https://agents-course-unit4-scoring.hf.space/docs)
-        ### 🏆 Score Interpretation:
-        - **30%+**: Excellent! You've achieved certification level ✅
-        - **20-29%**: Good progress! Keep improving 📈
-        - **10-19%**: On the right track! Add more tools 🔧
-        - **0-9%**: Keep experimenting! Study the questions 💪
-        Remember: Human performance is ~92%, GPT-4 with plugins is ~15%. You're competing with AI systems!
-        """
     )
     run_button.click(
@@ -546,7 +511,6 @@ with gr.Blocks(theme=gr.themes.Soft(), title="GAIA Agent Evaluation") as demo:
         outputs=[status_output, results_table]
     )
 if __name__ == "__main__":
     print("🚀 Launching GAIA Agent Evaluation Interface...")
-    demo.launch(debug=True, share=False)

 import json
 # --- Constants ---
+DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"  # (no /docs)
 # --- Enhanced GAIA Agent ---
 class GAIAAgent:
     Enhanced agent optimized for GAIA Level 1 questions.
     Targets 30%+ accuracy through multi-tool integration.
     """
     def __init__(self):
         print("✅ GAIA Agent initialized with enhanced capabilities.")
         self.api_url = DEFAULT_API_URL
     def __call__(self, question: str, task_id: str = None) -> str:
         """
         Main entry point - processes a question and returns a precise answer.
         print(f"🧠 Processing Task: {task_id}")
         print(f"📝 Question: {question[:100]}...")
         print(f"{'='*60}")
         try:
             # Step 1: Classify question type
             q_type = self._classify_question(question)
             print(f"📊 Question Type: {q_type}")
             # Step 2: Route to specialized handler
             answer = self._route_to_handler(question, q_type, task_id)
             # Step 3: Clean and format answer
             final_answer = self._clean_answer(answer, question)
             print(f"✅ Final Answer: {final_answer}")
             return final_answer
         except Exception as e:
             print(f"❌ Error: {e}")
             # Return a safe fallback
             return "Unable to determine answer"
     def _classify_question(self, question: str) -> str:
         """Classify question to route to appropriate handler"""
         q_lower = question.lower()
         # Math/calculation questions
         if any(word in q_lower for word in ["calculate", "sum", "total", "multiply", "divide", "average", "mean"]):
             return "math"
         # Questions with numbers/operators
         if any(op in question for op in ["+", "-", "×", "÷", "*", "/"]) and any(c.isdigit() for c in question):
             return "math"
         # Counting questions
         if any(word in q_lower for word in ["how many", "count", "number of"]):
             return "counting"
         # Date/time questions
         if any(word in q_lower for word in ["year", "date", "when", "month", "day"]):
             return "date"
         # Location questions
         if any(word in q_lower for word in ["where", "location", "city", "country", "capital"]):
             return "location"
         # Definition/what is questions
         if q_lower.startswith("what is") or q_lower.startswith("what's"):
             return "definition"
         # Who questions
         if q_lower.startswith("who"):
             return "person"
         # File-based questions
         if any(word in q_lower for word in ["file", "document", "image", "picture", "photo"]):
             return "file"
         return "general"
     def _route_to_handler(self, question: str, q_type: str, task_id: str) -> str:
         """Route question to appropriate specialized handler"""
         if q_type == "math":
             return self._handle_math(question)
         elif q_type == "counting":
             return self._handle_file(question, task_id)
         else:
             return self._handle_general(question)
     def _handle_math(self, question: str) -> str:
         """Handle mathematical calculations"""
         try:
             numbers = re.findall(r'-?\d+\.?\d*', question)
             if not numbers:
                 return "0"
             nums = [float(n) for n in numbers]
             q_lower = question.lower()
             # Detect operation
             if "sum" in q_lower or "total" in q_lower or "+" in question or "add" in q_lower:
                 result = sum(nums)
                 # Try to evaluate the expression safely
                 expr = re.sub(r'[^0-9+\-*/().\s]', '', question)
                 result = eval(expr, {"__builtins__": {}}, {})
             # Format result
             if result == int(result):
                 return str(int(result))
             else:
                 return f"{result:.2f}"
         except Exception as e:
             print(f"Math error: {e}")
             return "0"
     def _handle_counting(self, question: str) -> str:
         """Handle counting questions"""
         # Extract the first number found (often the answer)
         numbers = re.findall(r'\d+', question)
         return numbers[0] if numbers else "0"
     def _handle_date(self, question: str) -> str:
         """Handle date/year questions"""
         # Look for 4-digit years
         years = re.findall(r'\b(19|20)\d{2}\b', question)
         if years:
             return years[0]
         # Look for dates
         dates = re.findall(r'\b\d{1,2}/\d{1,2}/\d{4}\b', question)
         if dates:
             return dates[0]
         return "Unknown"
     def _handle_location(self, question: str) -> str:
         """Handle location questions using knowledge base"""
         q_lower = question.lower()
         # Common capitals and locations
         location_kb = {
             "france": "Paris",
             "spain": "Madrid",
             "madrid": "Spain",
         }
         for key, value in location_kb.items():
             if key in q_lower:
                 return value
         return "Unknown"
     def _handle_definition(self, question: str) -> str:
         """Handle 'What is' questions"""
         # Extract the subject
             subject = match.group(1).strip()
             return f"{subject}"
         return "Unknown"
     def _handle_person(self, question: str) -> str:
         """Handle 'Who' questions using knowledge base"""
         q_lower = question.lower()
         # Famous people knowledge base
         people_kb = {
             "romeo and juliet": "William Shakespeare",
             "light bulb": "Thomas Edison",
             "first president": "George Washington",
         }
         for key, value in people_kb.items():
             if key in q_lower:
                 return value
         return "Unknown"
     def _handle_file(self, question: str, task_id: str) -> str:
         """Handle questions that require file access"""
         if not task_id:
             return "No file available"
         try:
             # Download the file from API
             file_url = f"{self.api_url}/files/{task_id}"
             print(f"📥 Downloading file from: {file_url}")
             response = requests.get(file_url, timeout=30)
             if response.status_code == 200:
                 # Process file based on type
                 content_type = response.headers.get('Content-Type', '')
                 if 'text' in content_type or 'json' in content_type:
                     # Text-based file
                     content = response.text
             else:
                 print(f"File download failed: {response.status_code}")
                 return "File not found"
         except Exception as e:
             print(f"File handling error: {e}")
             return "File processing failed"
     def _analyze_text_file(self, content: str, question: str) -> str:
         """Analyze text file content to answer question"""
         q_lower = question.lower()
         # Counting items in file
         if "how many" in q_lower:
             lines = content.strip().split('\n')
             return str(len(lines))
         # Finding specific text
         if "find" in q_lower or "search" in q_lower:
             # Extract search term
                     return "Found"
                 else:
                     return "Not found"
         # Return first line as fallback
         lines = content.strip().split('\n')
         return lines[0] if lines else "Empty file"
     def _handle_general(self, question: str) -> str:
         """Handle general questions with basic reasoning"""
         # Try to extract any numbers or dates
         numbers = re.findall(r'\d+', question)
         if numbers:
             return numbers[0]
         # Look for yes/no questions
         if question.strip().endswith('?') and any(word in question.lower() for word in ['is', 'are', 'was', 'were', 'can', 'could', 'will', 'would']):
             return "Yes"
         return "Unable to determine"
     def _clean_answer(self, answer: str, question: str) -> str:
         """
         Clean and format answer according to GAIA requirements.
         """
         # Remove extra whitespace
         answer = answer.strip()
         # Remove "The answer is" or similar phrases
         answer = re.sub(r'^(?:the answer is|it is|result is)[:\s]+', '', answer, flags=re.IGNORECASE)
         # Remove trailing punctuation (except for decimals)
         answer = re.sub(r'[.!?,;]+$', '', answer)
         # Handle comma-separated lists
         if "comma-separated" in question.lower() or "list" in question.lower():
             # Ensure proper comma-space formatting
             answer = re.sub(r'\s*,\s*', ', ', answer)
         # Handle number formatting
         if re.match(r'^-?\d+\.?\d*$', answer):
             # It's a number
             else:
                 # Keep minimal decimal places
                 answer = f"{num:.10g}"
         return answer
         return "❌ Please login to Hugging Face first.", None
     api_url = DEFAULT_API_URL
+    questions_url = f"{api_url}/questions"     # Corrected endpoint
+    submit_url = f"{api_url}/submit"           # Corrected endpoint
     # Create Agent
     try:
         response = requests.get(questions_url, timeout=30)
         response.raise_for_status()
         questions_data = response.json()
         if not questions_data:
             return "⚠️ No questions received from API.", None
         print(f"✅ Retrieved {len(questions_data)} questions.")
     except requests.exceptions.RequestException as e:
         return f"❌ Error fetching questions: {e}\n\nPlease check if the API is available.", None
     # Run Agent on all questions
     results_log = []
     answers_payload = []
     print(f"\n🤖 Running agent on {len(questions_data)} questions...\n")
     for i, item in enumerate(questions_data, 1):
         task_id = item.get("task_id")
         question_text = item.get("question")
         if not task_id or not question_text:
             continue
         try:
             print(f"\n[{i}/{len(questions_data)}] Processing: {task_id}")
             submitted_answer = agent(question_text, task_id)
             answers_payload.append({
                 "task_id": task_id,
                 "submitted_answer": submitted_answer
             })
             results_log.append({
                 "Task ID": task_id,
                 "Question": question_text[:80] + "..." if len(question_text) > 80 else question_text,
                 "Your Answer": submitted_answer
             })
         except Exception as e:
             error_msg = f"ERROR: {e}"
             print(f"❌ {error_msg}")
         response = requests.post(submit_url, json=submission_data, timeout=120)
         response.raise_for_status()
         result_data = response.json()
         score = result_data.get('score', 0)
         correct = result_data.get('correct_count', 0)
         total = result_data.get('total_attempted', len(answers_payload))
         # Determine emoji based on score
         if score >= 30:
             emoji = "🎉🏆"
             emoji = "📈"
         else:
             emoji = "💪"
         final_status = (
             f"{emoji} Submission Complete!\n\n"
             f"👤 Username: {result_data.get('username')}\n"
             f"📝 {result_data.get('message', '')}\n\n"
             f"🔗 Check the leaderboard: https://huggingface.co/spaces/agents-course/agents-course-unit4-leaderboard"
         )
         return final_status, results_df
     except requests.exceptions.RequestException as e:
         return f"❌ Submission failed: {e}\n\n✅ Generated {len(answers_payload)} answers (see table)", results_df
 # --- Gradio Interface ---
 with gr.Blocks(theme=gr.themes.Soft(), title="GAIA Agent Evaluation") as demo:
     gr.Markdown(
+    """
+    # 🤖 GAIA Agent Evaluation System
+    ### 🎯 Goal: Achieve 30%+ accuracy on GAIA Level 1 questions
+    This agent evaluates your AI assistant on 20 carefully selected questions from GAIA's validation set.
+    The questions test reasoning, calculation, factual knowledge, and tool usage.
+    ---
+    Please clone this space, log in, and click 'Run Evaluation' to see your score!
+    """
     )
     with gr.Row():
         gr.LoginButton()
     gr.Markdown("---")
     run_button = gr.Button(
         "🚀 Run Evaluation & Submit All Answers",
         variant="primary",
         size="lg"
     )
     status_output = gr.Textbox(
         label="📊 Evaluation Results",
         lines=12,
         interactive=False,
         show_copy_button=True
     )
     results_table = gr.DataFrame(
         label="📝 Questions and Your Answers",
         wrap=True,
         interactive=False
     )
     gr.Markdown(
+    """
+    ---
+    ### 🔗 Resources:
+    - [GAIA Benchmark Paper](https://arxiv.org/abs/2311.12983)
+    - [Leaderboard](https://huggingface.co/spaces/agents-course/agents-course-unit4-leaderboard)
+    - [Course Materials](https://huggingface.co/learn/cookbook/agents)
+    - [API Documentation](https://agents-course-unit4-scoring.hf.space/docs)
+    ---
+    """
     )
     run_button.click(
         outputs=[status_output, results_table]
     )
 if __name__ == "__main__":
     print("🚀 Launching GAIA Agent Evaluation Interface...")
+    demo.launch(debug=True, share=False)