Final_Assignment_Template

Sleeping

App Files Files Community

thinhbtt committed on Nov 13, 2025

Commit

c3887a9

verified ·

1 Parent(s): e3e2f42

Update app.py

Browse files

Files changed (1) hide show

app.py +353 -126

app.py CHANGED Viewed

@@ -1,107 +1,353 @@
 import os
-import gradio as gr
 import requests
 import pandas as pd
-import re
-# -----------------------------------------------
-# CONSTANTS
-# -----------------------------------------------
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
-# -----------------------------------------------
-# BASIC RULE-BASED AGENT (Không dùng OpenAI)
-# -----------------------------------------------
 class BasicAgent:
     def __init__(self):
-        print("Rule-Based Agent initialized.")
-    # ---------- 1. Solve math expressions ----------
     def solve_math(self, text):
-        # detect simple arithmetic 1+2, 5*7, 10/2...
         expr = re.findall(r"[-+]?\d+\.?\d*|\+|\-|\*|\/", text)
         if len(expr) >= 3:
             try:
-                result = eval("".join(expr))
-                if isinstance(result, float) and result.is_integer():
-                    result = int(result)
-                return str(result)
-            except:
                 return None
         return None
-    # ---------- 2. Count characters inside quotes ----------
     def solve_counting(self, text):
-        m = re.search(r'"(.*?)"', text)
         if m:
             return str(len(m.group(1)))
         return None
-    # ---------- 3. If question asks for “how many words” ----------
-    def solve_word_count(self, text):
-        m = re.search(r'count the words in "(.*?)"', text.lower())
-        if m:
-            return str(len(m.group(1).split()))
-        return None
-    # ---------- 4. Simple factual patterns ----------
-    def solve_simple_fact(self, text):
-        text_lower = text.lower()
-        if "capital of france" in text_lower:
             return "Paris"
-        if "capital of japan" in text_lower:
             return "Tokyo"
-        if "pi to 2 decimals" in text_lower:
             return "3.14"
         return None
-    # ---------- MAIN CALL ----------
-    def __call__(self, question: str) -> str:
-        print(f"Agent solving: {question[:50]}...")
         # 1. math
-        ans = self.solve_math(question)
         if ans:
-            print("→ Math solved:", ans)
             return ans
-        # 2. char counting
-        ans = self.solve_counting(question)
         if ans:
-            print("→ Counting solved:", ans)
             return ans
-        # 3. word counting
-        ans = self.solve_word_count(question)
         if ans:
-            print("→ Word count solved:", ans)
             return ans
-        # 4. simple fact patterns
-        ans = self.solve_simple_fact(question)
         if ans:
-            print("→ Fact solved:", ans)
             return ans
-        # default fallback
-        print("→ No rule matched → returning fallback")
         return "unknown"
-# ---------------------------------------------------------
-# SUBMISSION + UI CODE (giữ nguyên, không chỉnh sửa)
-# ---------------------------------------------------------
 def run_and_submit_all(profile: gr.OAuthProfile | None):
-    space_id = os.getenv("SPACE_ID")
     if profile:
         username = f"{profile.username}"
-        print(f"User logged in: {username}")
     else:
-        print("User not logged in.")
         return "Please Login to Hugging Face with the button.", None
     api_url = DEFAULT_API_URL
@@ -115,93 +361,74 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
         return f"Error initializing agent: {e}", None
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
-    print(agent_code)
     # Fetch Questions
     try:
-        response = requests.get(questions_url, timeout=15)
-        response.raise_for_status()
-        questions_data = response.json()
-        print(f"Fetched {len(questions_data)} questions.")
     except Exception as e:
         return f"Error fetching questions: {e}", None
-    # Run Agent
     results_log = []
     answers_payload = []
     for item in questions_data:
         task_id = item.get("task_id")
-        qtext = item.get("question")
-        if not task_id or qtext is None:
             continue
         try:
-            submitted_answer = agent(qtext)
-            answers_payload.append({
-                "task_id": task_id,
-                "submitted_answer": submitted_answer
-            })
-            results_log.append({
-                "Task ID": task_id,
-                "Question": qtext,
-                "Submitted Answer": submitted_answer
-            })
         except Exception as e:
-            results_log.append({
-                "Task ID": task_id,
-                "Question": qtext,
-                "Submitted Answer": f"ERROR: {e}"
-            })
-    # Submit
-    submission_data = {
-        "username": username,
-        "agent_code": agent_code,
-        "answers": answers_payload
-    }
-    try:
-        response = requests.post(submit_url, json=submission_data, timeout=60)
-        response.raise_for_status()
-        result_data = response.json()
         final_status = (
-            f"Submission Successful!\n"
-            f"User: {result_data.get('username')}\n"
-            f"Score: {result_data.get('score')}% "
         )
         return final_status, pd.DataFrame(results_log)
     except Exception as e:
         return f"Submission Failed: {e}", pd.DataFrame(results_log)
-# ---------------------------
-# GRADIO UI
-# ---------------------------
 with gr.Blocks() as demo:
-    gr.Markdown("# Basic Agent Evaluation Runner")
-    gr.Markdown("""
-    **Instructions:**
-    1. Duplicate this space.
-    2. Modify your agent's logic in the BasicAgent class only.
-    3. Login to HuggingFace.
-    4. Press Run Evaluation & Submit.
-    """)
     gr.LoginButton()
     run_button = gr.Button("Run Evaluation & Submit All Answers")
-    status_output = gr.Textbox(label="Run Status / Submission Result", lines=5)
-    results_table = gr.DataFrame(label="Questions and Agent Answers")
-    run_button.click(run_and_submit_all, outputs=[status_output, results_table])
 if __name__ == "__main__":
-    demo.launch()

+# app.py (FULL - Rule-based Level 2 Agent using Wikipedia + file reading + heuristics)
 import os
+import re
+import io
+import time
+import json
 import requests
 import pandas as pd
+import gradio as gr
+# optional imports; agent works without them but will use if available
+try:
+    from bs4 import BeautifulSoup
+except Exception:
+    BeautifulSoup = None
+try:
+    import PyPDF2
+except Exception:
+    PyPDF2 = None
+try:
+    from PIL import Image
+    import pytesseract
+except Exception:
+    Image = None
+    pytesseract = None
+# ------------------------------
+# Constants
+# ------------------------------
+# Base URL of the scoring service; BasicAgent stores it and the file-download
+# route ({api_url}/files/{task_id}) is built from it.
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
+# MediaWiki Action API endpoint used by the Wikipedia helper functions.
+WIKIPEDIA_API = "https://en.wikipedia.org/w/api.php"
+# Headers sent with every outgoing HTTP request made by this module.
+# NOTE(review): the contact address looks like a placeholder - replace it with a real one.
+USER_AGENT = {"User-Agent": "HF-GAIA-Agent/1.0 (contact: you@example.com)"}
+# ------------------------------
+# Utility functions
+# ------------------------------
+def extract_numbers(text):
+    """Return the numeric strings found in ``text``, in order of appearance.
+
+    Integers and decimals are recognised. Thousands separators are removed
+    from the returned strings (``"1,234.5"`` -> ``"1234.5"``) and
+    non-breaking spaces are treated as ordinary spaces.
+
+    Returns an empty list for empty or ``None`` input.
+    """
+    if not text:
+        return []
+    # First alternative: a comma-grouped number (1,234 / 1,234,567.89). The
+    # (?!\d) guard stops it from ending in the middle of a longer digit run.
+    # Second alternative: any plain digit run with an optional fraction, so a
+    # long integer such as "12345" is kept in one piece instead of being
+    # split after four digits.
+    pattern = r"\d{1,3}(?:,\d{3})+(?!\d)(?:\.\d+)?|\d+(?:\.\d+)?"
+    matches = re.findall(pattern, text.replace("\xa0", " "))
+    # normalize commas
+    return [m.replace(",", "") for m in matches]
+def simple_normalize(s):
+    """Trim ``s``, collapse each whitespace run to one space and lower-case it.
+
+    A falsy argument (``None`` or ``""``) yields ``""``.
+    """
+    trimmed = (s or "").strip()
+    collapsed = re.sub(r"\s+", " ", trimmed)
+    return collapsed.lower()
+def wikipedia_search_first_page(query):
+    """Search Wikipedia and return the title of the top hit, or None.
+
+    Best-effort helper: a blank query, a network/HTTP failure, an
+    undecodable response or an empty result list all yield ``None``.
+    """
+    query = (query or "").strip()
+    if not query:
+        # A blank query cannot produce a meaningful hit; skip the round trip.
+        return None
+    params = {
+        "action": "query",
+        "list": "search",
+        "srsearch": query,
+        "format": "json",
+        # Only the first hit is ever used, so do not request more.
+        "srlimit": 1,
+    }
+    try:
+        r = requests.get(WIKIPEDIA_API, params=params, headers=USER_AGENT, timeout=10)
+        r.raise_for_status()
+        data = r.json()
+        hits = data.get("query", {}).get("search", [])
+        if hits:
+            return hits[0].get("title")
+    except Exception:
+        # Deliberately best-effort: any failure is reported as "no page found".
+        return None
+    return None
+def wikipedia_get_extract(title):
+    """Return the plain-text extract for a Wikipedia page title.
+
+    Redirects are followed. Returns ``""`` when the title is blank, the
+    request fails, or the response carries no extract.
+    """
+    title = (title or "").strip()
+    if not title:
+        return ""
+    params = {
+        "action": "query",
+        "prop": "extracts",
+        "explaintext": 1,
+        "titles": title,
+        "format": "json",
+        "redirects": 1,
+    }
+    try:
+        r = requests.get(WIKIPEDIA_API, params=params, headers=USER_AGENT, timeout=10)
+        r.raise_for_status()
+        data = r.json()
+        pages = data.get("query", {}).get("pages", {})
+        # A single title is requested, so the first page entry is the answer.
+        first_page = next(iter(pages.values()), None)
+        if first_page:
+            # "or" guards against a null extract so callers always get a str.
+            return first_page.get("extract") or ""
+    except Exception:
+        # Deliberately best-effort: any failure is reported as "no text".
+        return ""
+    return ""
+def wiki_try_find_number(question):
+    """Guess a numeric answer to ``question`` from a Wikipedia page extract.
+
+    Steps:
+      1. Derive a search hint by cutting "how many", "between ...",
+         "from ... to ...", "included ..." and "in the video ..." out of the
+         question; fall back to the full question if the hint finds nothing.
+      2. Fetch the plain-text extract of the top search hit.
+      3. Collect numbers from sentences that contain one of the first six
+         3+-letter words of the question (substring match) or a topical
+         marker, and return the number from the best-scoring sentence.
+      4. Otherwise return the first number anywhere in the extract.
+
+    Returns the chosen number as a string, or ``None`` when the question is
+    blank, no page/extract is found, or the extract holds no number.
+    """
+    q = (question or "").strip()
+    if not q:
+        return None
+    # remove leading "How many" etc to get search hint
+    search_hint = re.sub(
+        r"(?i)how many|between.*|from.*to.*|included.*|in the video.*", "", q
+    ).strip()
+    title = wikipedia_search_first_page(search_hint) if search_hint else None
+    if not title and search_hint != q:
+        # The hint found nothing (or was empty): retry with the full question.
+        # Skipped when hint == question, which would repeat the same request.
+        title = wikipedia_search_first_page(q)
+    if not title:
+        return None
+    extract = wikipedia_get_extract(title)
+    if not extract:
+        return None
+    # Keywords: the first six alphabetic words (3+ letters) of the question.
+    words = [w.lower() for w in re.findall(r"[A-Za-z]{3,}", q)][:6]
+    topic_markers = ("studio album", "album", "species", "population", "released")
+    sentences = re.split(r'(?<=[\.\?\!])\s+', extract)
+    candidate_nums = []
+    for s in sentences:
+        s_low = s.lower()
+        # score = how many question keywords occur in this sentence
+        score = sum(1 for w in words if w in s_low)
+        if score >= 1 or any(k in s_low for k in topic_markers):
+            candidate_nums.extend((n, score, s.strip()) for n in extract_numbers(s))
+    if candidate_nums:
+        # Highest keyword score wins; ties go to the longer sentence, then to
+        # the earliest candidate (max() keeps the first maximal element).
+        best = max(candidate_nums, key=lambda c: (c[1], len(c[2])))
+        return best[0]
+    # fallback: any number in extract
+    all_nums = extract_numbers(extract)
+    if all_nums:
+        return all_nums[0]
+    return None
+def fetch_file_text(api_url, task_id):
+    """Fetch the attachment for ``task_id`` via GET {api_url}/files/{task_id} and return its text.
+
+    Only a 200 response is processed. The body is interpreted by trying, in order:
+      1. JSON (when Content-Type contains "application/json"): a dict's
+         "content" or "text" field, or the joined "content" fields of a list.
+      2. UTF-8 text, accepted only if it has more than 20 non-blank-trimmed characters.
+      3. PDF text extraction, if PyPDF2 was importable.
+      4. OCR of an image, if PIL and pytesseract were importable.
+
+    Returns the extracted text, or None when nothing could be extracted or
+    any step failed (all exceptions are swallowed).
+    """
+    try:
+        files_url = f"{api_url}/files/{task_id}"
+        r = requests.get(files_url, headers=USER_AGENT, timeout=15)
+        if r.status_code == 200:
+            content_type = r.headers.get("Content-Type", "")
+            # some endpoints may return raw text or JSON with 'content' and 'filename'
+            if "application/json" in content_type:
+                j = r.json()
+                # expecting {'filename': ..., 'content': '...'} maybe
+                if isinstance(j, dict):
+                    if j.get("content"):
+                        return j.get("content")
+                    # else maybe direct text in 'text' field
+                    if j.get("text"):
+                        return j.get("text")
+                    # NOTE(review): a dict with neither field falls through to the
+                    # raw-bytes handling below, so the JSON source itself may be
+                    # returned as "text" - confirm this is intended.
+                # else if it's list, return aggregated
+                if isinstance(j, list):
+                    texts = []
+                    for it in j:
+                        if isinstance(it, dict) and "content" in it:
+                            texts.append(it.get("content", ""))
+                    # a list response never falls through: joined text or None
+                    return "\n".join(texts) if texts else None
+            # if raw PDF or binary
+            raw = r.content
+            # try to interpret as text
+            try:
+                text = raw.decode("utf-8")
+                # if readable, return (very short payloads are not trusted as text)
+                if len(text.strip()) > 20:
+                    return text
+            except Exception:
+                # not valid UTF-8: continue with the binary decoders
+                pass
+            # try pdf via PyPDF2 if available
+            if PyPDF2 is not None:
+                try:
+                    reader = PyPDF2.PdfReader(io.BytesIO(raw))
+                    pages = []
+                    for p in reader.pages:
+                        try:
+                            pages.append(p.extract_text() or "")
+                        except Exception:
+                            # skip pages whose text cannot be extracted
+                            continue
+                    # NOTE: returns here even when the result is None, so the OCR
+                    # step below is only reached if opening the PDF raised.
+                    return "\n".join(pages).strip() or None
+                except Exception:
+                    pass
+            # lastly if image and pytesseract available
+            if Image is not None and pytesseract is not None:
+                try:
+                    img = Image.open(io.BytesIO(raw))
+                    txt = pytesseract.image_to_string(img)
+                    return txt
+                except Exception:
+                    pass
+    except Exception:
+        # best-effort: network/HTTP/JSON errors are reported as "no file text"
+        pass
+    return None
+def youtube_oembed_title_desc(url):
+    """Look up descriptive text for a video URL through oEmbed services.
+
+    YouTube's oEmbed endpoint is asked first and, on a 200 response, its
+    title is returned as-is. Otherwise noembed.com is asked and
+    "<title> <description>" is returned. Any failure of either request is
+    ignored; when neither yields a result the function returns "".
+    """
+    common = {"headers": USER_AGENT, "timeout": 10}
+    # Primary source: YouTube oEmbed (title only; no description is exposed).
+    try:
+        resp = requests.get(
+            "https://www.youtube.com/oembed",
+            params={"url": url, "format": "json"},
+            **common,
+        )
+        if resp.status_code == 200:
+            return resp.json().get("title", "")
+    except Exception:
+        pass
+    # Secondary source: noembed
+    try:
+        resp = requests.get("https://noembed.com/embed", params={"url": url}, **common)
+        if resp.status_code == 200:
+            payload = resp.json()
+            description = payload.get("description") or ""
+            return payload.get("title", "") + " " + description
+    except Exception:
+        pass
+    return ""
+# ------------------------------
+# Agent
+# ------------------------------
 class BasicAgent:
+    """Rule-based question answerer.
+
+    Calling the instance tries a fixed chain of solvers (arithmetic, quoted
+    string counting, hard-coded facts, then URL / attachment / Wikipedia
+    number lookup) and returns the first non-empty answer, or "unknown".
+    """
     def __init__(self):
+        print("Level-2 Rule Agent initialized (wiki + file tools).")
+        # base URL used to download task attachments
+        self.api_url = DEFAULT_API_URL
     def solve_math(self, text):
+        """Evaluate the first explicit arithmetic expression found in ``text``.
+
+        An expression is a run of numbers joined by ``+ - * /`` (optional
+        spaces, optional leading minus on each number), e.g. "12 + 5".
+        Numbers that merely appear in the same sentence are NOT combined.
+
+        Returns the result as a string (whole-valued floats are printed as
+        integers), or None when there is no expression or it cannot be
+        evaluated (division by zero, leading zeros, ...).
+        """
+        # Require operators *between* operands. Joining every numeric token of
+        # the question would turn "between 2000 and 2009 ... 3" into the
+        # bogus answer 200020093 and block all later solvers.
+        m = re.search(
+            r"(?<![\w.])-?\d+(?:\.\d+)?(?:\s*[-+*/]\s*-?\d+(?:\.\d+)?)+",
+            text or "",
+        )
+        if not m:
+            return None
+        safe = re.sub(r"\s+", "", m.group(0))
+        # limit length
+        if len(safe) >= 100:
+            return None
+        try:
+            # NOTE: eval is reached only for text matched by the pattern above
+            # (digits, dots and single + - * / operators); builtins are removed
+            # as an extra precaution.
+            res = eval(safe, {"__builtins__": {}}, {})
+        except Exception:
+            return None
+        if isinstance(res, float) and res.is_integer():
+            res = int(res)
+        return str(res)
     def solve_counting(self, text):
+        """Count characters or words of a double-quoted string in ``text``.
+
+        Handles 'how many characters in "..."' (length of the quoted text),
+        'how many words in "..."' (whitespace-separated words) and, as a
+        generic fallback, the character count of the first quoted string when
+        the text mentions "characters" or "how many". Returns a string or None.
+        """
+        # detect patterns like 'how many characters in "..."' or 'How many words in "..."'
+        m = re.search(r'how many characters in\s*"(.*?)"', text, re.I)
         if m:
             return str(len(m.group(1)))
+        m2 = re.search(r'how many words in\s*"(.*?)"', text, re.I)
+        if m2:
+            return str(len(m2.group(1).split()))
+        # generic quoted count
+        m3 = re.search(r'"(.*?)"', text)
+        if m3 and ("characters" in text.lower() or "how many" in text.lower()):
+            return str(len(m3.group(1)))
         return None
+    def solve_simple_facts(self, text):
+        """Answer a few hard-coded facts and a simple reversed-text pattern.
+
+        The reversed-text branch fires when the stripped text ends with the
+        standalone word "fi" (any case) or mentions both "reverse" and
+        "text"; it returns every whitespace-separated word reversed, with the
+        word order left unchanged. Returns None when nothing matches.
+        """
+        t = text.lower()
+        # trivial mappings
+        if "capital of france" in t:
             return "Paris"
+        if "capital of japan" in t:
             return "Tokyo"
+        if "pi to 2 decimals" in t or "pi to 2 decimal" in t:
             return "3.14"
+        # reversed sentence detection (some GAIA items)
+        if re.search(r'\bfi\b$', text.strip(), re.I) or ("reverse" in t and "text" in t):
+            # try a simple reverse of words if that seems to be asked
+            words = text.split()
+            return " ".join(w[::-1] for w in words)
         return None
+    def solve_with_wikipedia(self, question, task_id=None):
+        """Look for a numeric answer in a linked URL, a task attachment or Wikipedia.
+
+        Order of attempts:
+          1. first URL in the question: YouTube oEmbed text, then the fetched
+             page body - the first number found is returned;
+          2. the attachment for ``task_id`` (if given): its first number is
+             returned, and an attachment without numbers ends the lookup;
+          3. the Wikipedia heuristic ``wiki_try_find_number``.
+
+        Returns a numeric string or None; every exception is swallowed.
+        """
+        try:
+            # If the question contains a specific URL to analyze (youtube), handle that
+            m = re.search(r'https?://[^\s]+', question)
+            if m:
+                url = m.group(0)
+                # youtube special handling
+                if "youtube.com" in url or "youtu.be" in url:
+                    txt = youtube_oembed_title_desc(url)
+                    if txt:
+                        nums = extract_numbers(txt)
+                        if nums:
+                            return nums[0]
+                # fetch the page itself; this also runs for YouTube URLs whose
+                # oEmbed text contained no number
+                try:
+                    r = requests.get(url, headers=USER_AGENT, timeout=10)
+                    r.raise_for_status()
+                    page_text = r.text
+                    nums = extract_numbers(page_text)
+                    if nums:
+                        return nums[0]
+                except Exception:
+                    pass
+            # try to fetch possible file text via dataset files route (some tasks have attachments)
+            if task_id:
+                file_text = fetch_file_text(self.api_url, task_id)
+                if file_text:
+                    n = extract_numbers(file_text)
+                    if n:
+                        return n[0]
+                    # an attachment without numbers is treated as unanswerable:
+                    # Wikipedia is not consulted in that case
+                    return None
+            # else try wikipedia search heuristics
+            candidate = wiki_try_find_number(question)
+            if candidate:
+                return candidate
+        except Exception:
+            return None
+        return None
+    def __call__(self, question: str, task_id: str = None) -> str:
+        """Answer ``question`` with the first solver that produces a result.
+
+        ``task_id`` is forwarded to the attachment lookup. Returns "unknown"
+        when no solver matches.
+        """
+        q = question or ""
+        print("Solving question:", q[:80].replace("\n", " ") + "...")
         # 1. math
+        ans = self.solve_math(q)
         if ans:
             return ans
+        # 2. counting
+        ans = self.solve_counting(q)
         if ans:
             return ans
+        # 3. trivial facts / simple patterns
+        ans = self.solve_simple_facts(q)
         if ans:
             return ans
+        # 4. wikipedia / files / url heuristics
+        ans = self.solve_with_wikipedia(q, task_id=task_id)
         if ans:
             return ans
+        # fallback
         return "unknown"
+# ------------------------------
+# Submission runner
+# ------------------------------
 def run_and_submit_all(profile: gr.OAuthProfile | None):
+    """
+    Fetches all questions, runs the BasicAgent on them, submits all answers,
+    and displays the results.
+    """
+    space_id = os.getenv("SPACE_ID") or "unknown-space"
     if profile:
         username = f"{profile.username}"
     else:
         return "Please Login to Hugging Face with the button.", None
     api_url = DEFAULT_API_URL
         return f"Error initializing agent: {e}", None
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main"
     # Fetch Questions
     try:
+        r = requests.get(questions_url, headers=USER_AGENT, timeout=15)
+        r.raise_for_status()
+        questions_data = r.json()
+        if not isinstance(questions_data, list):
+            return "Questions endpoint returned invalid format.", None
     except Exception as e:
         return f"Error fetching questions: {e}", None
     results_log = []
     answers_payload = []
     for item in questions_data:
         task_id = item.get("task_id")
+        question_text = item.get("question")
+        if not task_id or question_text is None:
             continue
         try:
+            ans = agent(question_text, task_id=task_id)
+            # ensure answers are strings
+            submitted_answer = str(ans) if ans is not None else "unknown"
+            answers_payload.append({"task_id": task_id, "submitted_answer": submitted_answer})
+            results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": submitted_answer})
+            time.sleep(0.2)  # polite pause to avoid hammering external services
         except Exception as e:
+            results_log.append({"Task ID": task_id, "Question": question_text, "Submitted Answer": f"ERROR: {e}"})
+    if not answers_payload:
+        return "Agent did not produce any answers.", pd.DataFrame(results_log)
+    submission_data = {"username": username.strip(), "agent_code": agent_code, "answers": answers_payload}
+    try:
+        resp = requests.post(submit_url, json=submission_data, headers=USER_AGENT, timeout=60)
+        resp.raise_for_status()
+        result = resp.json()
         final_status = (
+            f"Submission Successful!\nUser: {result.get('username')}\n"
+            f"Overall Score: {result.get('score', 'N/A')}% "
+            f"({result.get('correct_count', '?')}/{result.get('total_attempted', '?')} correct)\n"
+            f"Message: {result.get('message', '')}"
         )
         return final_status, pd.DataFrame(results_log)
+    except requests.exceptions.HTTPError as e:
+        try:
+            body = e.response.json()
+            detail = body.get("detail") or json.dumps(body)[:400]
+        except Exception:
+            detail = e.response.text[:400]
+        return f"Submission Failed: HTTP {e.response.status_code} - {detail}", pd.DataFrame(results_log)
     except Exception as e:
         return f"Submission Failed: {e}", pd.DataFrame(results_log)
+# ------------------------------
+# Gradio UI
+# ------------------------------
+# Page layout: heading, short instructions, login button, run button and the
+# two output widgets that run_and_submit_all fills in.
 with gr.Blocks() as demo:
+    gr.Markdown("# Level-2 Agent (Rule-based + Wiki/File Tools)")
+    gr.Markdown(
+        "Duplicate this space, make it public, then login and press **Run Evaluation & Submit All Answers**."
+    )
     gr.LoginButton()
     run_button = gr.Button("Run Evaluation & Submit All Answers")
+    status_output = gr.Textbox(label="Run Status / Submission Result", lines=6, interactive=False)
+    results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
+    # No explicit inputs are wired; presumably Gradio supplies the OAuth profile
+    # argument from the handler's type annotation - TODO confirm.
+    run_button.click(fn=run_and_submit_all, inputs=[], outputs=[status_output, results_table])
 if __name__ == "__main__":
+    # Listen on all interfaces; the port comes from $PORT, defaulting to 7860.
+    demo.launch(server_name="0.0.0.0", server_port=int(os.environ.get("PORT", 7860)))