Final_Assignment_Template

Sleeping

App Files Files Community

beyzapehlivan committed on 24 days ago

Commit

af175c6

verified ·

1 Parent(s): 08647f9

Update app.py

Browse files

Files changed (1) hide show

app.py +39 -73

app.py CHANGED Viewed

@@ -2,73 +2,43 @@ import os
 import gradio as gr
 import requests
 import pandas as pd
-# ADDED BY BEYZAPEHLIVAN
 from smolagents import CodeAgent, HfApiModel, DuckDuckGoSearchTool, VisitWebpageTool
-# (Keep Constants as is)
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
-# --- Basic Agent Definition ---
-# ----- THIS IS WHERE YOU CAN BUILD WHAT YOU WANT ------
-# --- NEW ALFRED AGENT ---
 token = os.getenv("HF_TOKEN")
-model = HfApiModel(model_id="Qwen/Qwen2.5-72B-Instruct", token=token)
 class AlfredAgent:
     def __init__(self):
-        CUSTOM_SYSTEM_PROMPT = """You are a helpful and agile assistant that has access to a set of tools.
-For every step, you must provide your reasoning in a 'Thoughts:' section and then the tool call in a 'Code:' section.
-Format:
-Thoughts: I need to search for...
-Code:
-```py
-print(web_search("question"))
-```<end_action>
-Rules:
-1. Provide ONLY the final answer value. No sentences.
-2. For dates, use YYYY-MM-DD.
-3. If you find the info, stop and give the answer immediately.
-Tools:
-{{managed_agents_descriptions}}
-{{authorized_imports}}"""
         self.agent = CodeAgent(
             tools=[VisitWebpageTool(), DuckDuckGoSearchTool()],
             model=model,
-            max_steps=10,
-            add_base_tools=False,
-            planning_interval=2,
             system_prompt=CUSTOM_SYSTEM_PROMPT
         )
     def __call__(self, question: str) -> str:
         try:
-            # Append an explicit rule to the question
-            full_prompt = f"Solve this GAIA task precisely: {question}. Return ONLY the value."
-            result = self.agent.run(full_prompt)
-            # Initial cleanup
             ans = str(result).strip()
-            # If the model said "Final Answer: 1928", keep only 1928
-            if "Final Answer:" in ans:
-                ans = ans.split("Final Answer:")[-1].strip()
-            # Word-based cleanup (drops unnecessary lead-ins)
-            for word in ["is:", "answer:", "result:", "the answer is"]:
-                if word in ans.lower():
-                    ans = ans.lower().split(word)[-1].strip()
-            # If still too long (it probably wrote a paragraph), keep only the last line/word
-            if len(ans) > 60:
-                ans = ans.split('\n')[-1].strip(" .\"'")
             return ans
-        except Exception:
-            # Even on error, return "Unknown" instead of "None" to preserve the format
             return "Unknown"
 def run_and_submit_all( profile: gr.OAuthProfile | None):
@@ -121,7 +91,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
         print(f"An unexpected error occurred fetching questions: {e}")
         return f"An unexpected error occurred fetching questions: {e}", None
-    # 3. Run your Agent (Bu kısmı bul ve değiştir)
     results_log = []
     answers_payload = []
@@ -198,31 +168,27 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
 # --- Build Gradio Interface using Blocks ---
-with gr.Blocks() as demo:
-    gr.Markdown("# Basic Agent Evaluation Runner")
-    gr.Markdown(
-        """
-        **Instructions:**
-        1.  Please clone this space, then modify the code to define your agent's logic, the tools, the necessary packages, etc ...
-        2.  Log in to your Hugging Face account using the button below. This uses your HF username for submission.
-        3.  Click 'Run Evaluation & Submit All Answers' to fetch questions, run your agent, submit answers, and see the score.
-        ---
-        **Disclaimers:**
-        Once clicking on the "submit button, it can take quite some time ( this is the time for the agent to go through all the questions).
-        This space provides a basic setup and is intentionally sub-optimal to encourage you to develop your own, more robust solution. For instance for the delay process of the submit button, a solution could be to cache the answers and submit in a seperate action or even to answer the questions in async.
-        """
-    )
-    gr.LoginButton()
-    run_button = gr.Button("Run Evaluation & Submit All Answers")
-    status_output = gr.Textbox(label="Run Status / Submission Result", lines=5, interactive=False)
-    # Removed max_rows=10 from DataFrame constructor
-    results_table = gr.DataFrame(label="Questions and Agent Answers", wrap=True)
     run_button.click(
         fn=run_and_submit_all,
         outputs=[status_output, results_table]

 import gradio as gr
 import requests
 import pandas as pd
 from smolagents import CodeAgent, HfApiModel, DuckDuckGoSearchTool, VisitWebpageTool
 # --- Constants ---
 DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
 token = os.getenv("HF_TOKEN")
+model = HfApiModel(model_id="meta-llama/Llama-3.1-70B-Instruct", token=token)
 class AlfredAgent:
     def __init__(self):
+        # CRITICAL PROMPT FOR THE 30% THRESHOLD
+        CUSTOM_SYSTEM_PROMPT = """You are a world-class GAIA solver.
+        1. Use web_search for facts.
+        2. Use visit_webpage for specific URLs or deep reading.
+        3. If you find multiple numbers, verify which one exactly answers the question.
+        4. Your final output must be ONLY the result (e.g., '15', 'Paris', '2022-03-01'). No explanations."""
         self.agent = CodeAgent(
             tools=[VisitWebpageTool(), DuckDuckGoSearchTool()],
             model=model,
+            max_steps=15, # Increased so the agent does not leave questions unfinished
+            add_base_tools=True,
+            additional_authorized_imports=['requests', 'bs4', 'pandas', 'json', 'math'],
             system_prompt=CUSTOM_SYSTEM_PROMPT
         )
     def __call__(self, question: str) -> str:
         try:
+            # Planned thinking and solving
+            result = self.agent.run(f"Carefully solve this task and give a concise final answer: {question}")
             ans = str(result).strip()
+            # Final filter that strips unnecessary clutter
+            if len(ans) > 50:
+                ans = ans.split('\n')[-1].replace("Final Answer:", "").strip(" .\"'")
             return ans
+        except Exception as e:
+            print(f"Agent Error: {e}")
             return "Unknown"
 def run_and_submit_all( profile: gr.OAuthProfile | None):
         print(f"An unexpected error occurred fetching questions: {e}")
         return f"An unexpected error occurred fetching questions: {e}", None
+    # 3. Run your Agent
     results_log = []
     answers_payload = []
 # --- Build Gradio Interface using Blocks ---
+with gr.Blocks(theme=gr.themes.Soft()) as demo:
+    gr.Markdown("# 🦉 Alfred GAIA Solver - Sertifika Takip Paneli")
+    with gr.Row():
+        with gr.Column(scale=1):
+            gr.LoginButton()
+            # Sadece TEK bir buton tanımlıyoruz
+            run_button = gr.Button("🚀 Sınavı Başlat ve Gönder", variant="primary")
+        with gr.Column(scale=2):
+            # Sadece TEK bir sonuç kutusu
+            status_output = gr.Textbox(label="📊 Güncel Skor ve Durum", lines=5)
+    # Alfred'in ne yaptığını görmek istersen bu kalsın, istemezsen silebilirsin.
+    # Ama şu an fonksiyonumuz 2 çıktı verdiği için bunu 'outputs' listesine eklemiyoruz.
+    agent_logs = gr.Textbox(label="🧠 Alfred'in İşlem Akışı", lines=10, interactive=False, visible=False)
+    # Sadece TEK bir tablo
+    results_table = gr.DataFrame(label="📝 Cevaplanan Sorular")
+    # TEK BİR TIKLAMA OLAYI (Senin fonksiyonun 2 veri döndürdüğü için 2 çıktı yazdık)
     run_button.click(
         fn=run_and_submit_all,
         outputs=[status_output, results_table]