Wen-ChuangChou commited on
Commit
1729ab6
·
1 Parent(s): cee706e

Add support for the Gemini model

Browse files
Files changed (3) hide show
  1. .gitignore +2 -1
  2. agent.py +314 -0
  3. app.py +2 -165
.gitignore CHANGED
@@ -1,2 +1,3 @@
1
  .env
2
- *pycache*
 
 
1
  .env
2
+ *pycache*
3
+ results/
agent.py ADDED
@@ -0,0 +1,314 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ import json
2
+ import os
3
+ import requests
4
+ import sys
5
+ import time
6
+ from datetime import datetime
7
+ from dotenv import load_dotenv
8
+ from typing import Dict, List, Any
9
+ from smolagents import DuckDuckGoSearchTool, OpenAIServerModel, CodeAgent, ActionStep, TaskStep
10
+ from blablador import Models
11
+
12
+ load_dotenv()
13
+
14
+
15
class BasicAgent:
    """Question-answering agent built on a smolagents ``CodeAgent``.

    Supports two OpenAI-compatible model providers ("Blablador" and
    "Gemini") and, after every question, appends a JSON trace of the
    agent's memory to ``memory_file`` so runs can be inspected offline.
    """

    def __init__(self,
                 model_provider: str = "Blablador",
                 memory_file: str = "agent_memory.json"):
        """Configure the LLM backend and build the CodeAgent.

        Args:
            model_provider: "Blablador" or "Gemini". Any other value is
                reported and the process exits with status 1.
            memory_file: Path of the JSON file memory traces are written to.
        """
        self.model_provider = model_provider
        self.memory_file = memory_file

        if model_provider == "Blablador":
            models = Models(
                api_key=os.getenv("Blablador_API_KEY")).get_model_ids()
            # Blablador model ids look like "<id> - <human name> ...";
            # keep the first two words of the human-readable part for logging.
            model_id_blablador = 5
            model_name = " ".join(
                models[model_id_blablador].split(" - ")[1].split()[:2])
            print("The agent uses the following model:", model_name)

            answer_llm = OpenAIServerModel(
                model_id=models[model_id_blablador],
                api_base="https://helmholtz-blablador.fz-juelich.de:8000/v1",
                api_key=os.getenv("Blablador_API_KEY"),
                flatten_messages_as_text=True,
                temperature=0.2)

        elif model_provider == "Gemini":
            # model_name = "gemini-2.5-flash-preview-05-20"
            model_name = "gemini-2.0-flash"
            print("The agent uses the following model:", model_name)

            # Gemini exposed through its OpenAI-compatible endpoint.
            answer_llm = OpenAIServerModel(
                model_id=model_name,
                api_base=
                "https://generativelanguage.googleapis.com/v1beta/openai/",
                api_key=os.getenv("Gemini_API_KEY2"),
                temperature=0.2)
        else:
            print(
                f"Error: Unsupported model provider '{model_provider}'. Only 'Blablador' and 'Gemini' are supported."
            )
            sys.exit(1)

        self.agent = CodeAgent(
            tools=[DuckDuckGoSearchTool()],
            model=answer_llm,
            planning_interval=3,
            max_steps=10,
            # verbosity_level=LogLevel.ERROR,
        )

    def __call__(self,
                 question: str,
                 task_id: str = "",
                 file_url: str = "",
                 file_ext: str = "") -> str:
        """Answer one question and persist the agent's memory trace.

        Args:
            question: The question text.
            task_id: Identifier used to key the memory-trace entry.
            file_url: Optional URL of an attachment; currently only mentioned
                in the prompt, the file itself is not downloaded.
            file_ext: Extension of the attachment, used in the prompt note.

        Returns:
            The agent's answer, or an ``"Error: ..."`` string on failure.
        """
        print(f"Agent received question (first 50 chars): {question[:50]}...")

        SYSTEM_PROMPT = """You are a general AI assistant. I will ask you a question.
Report your thoughts, and finish your answer with the following template: FINAL ANSWER: [YOUR FINAL ANSWER].
YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.
If you are asked for a number, don't use comma to write your number
neither use units such as $ or percent sign unless specified otherwise.
If you are asked for a string, don't use articles, neither abbreviations, (e.g. for cities),
and write the digits in plain text unless specified otherwise.
If you are asked for a comma separated list,
apply the above rules depending of whether the element to be put in the list is a number or a string.
"""

        if file_url:
            # File handling is not wired into agent.run() yet; record the
            # attachment metadata so a future version can pass it via
            # additional_args, and tell the model a file exists.
            # BUG FIX: this used to clobber the dict with the throwaway
            # string f"{file_url}_{file_ext}".
            additional_args = {"file_url": file_url,
                               "file_extension": file_ext}  # noqa: F841 — reserved for future use
            full_prompt = f"{SYSTEM_PROMPT}\n\nQuestion: {question}\n\nNote: A {file_ext} file has been provided and is available for your analysis."
        else:
            full_prompt = f"{SYSTEM_PROMPT}\n\nQuestion: {question}"

        try:
            answer = self.agent.run(full_prompt)
            print(f"Agent returning answer: {answer}")

            # Export memory after execution
            self.export_memory_to_json(task_id=task_id,
                                       question=question,
                                       answer=answer)

            # Sleep for 10 seconds if using Gemini to avoid rate limiting
            if self.model_provider == "Gemini":
                time.sleep(10)
            return answer
        except Exception as e:
            print(f"Error running agent: {e}")
            # Record the failure in the trace too, so failed questions are
            # visible in the memory file (the `error` field was previously
            # never populated).
            self.export_memory_to_json(task_id=task_id,
                                       question=question,
                                       error=str(e))
            return f"Error: {e}"

    def export_memory_to_json(self,
                              task_id: str = "",
                              question: str = "",
                              answer: str = "",
                              error: str = ""):
        """Append (or update) one question's memory trace in the JSON file.

        Entries are keyed by ``task_id``; an existing entry with the same id
        is overwritten, otherwise the entry is appended.
        """
        memory_data = self.extract_memory_data()

        # Load existing memory file if it exists; a corrupted or truncated
        # file must not crash the run, so fall back to a fresh structure.
        existing_data = {"questions": [], "batch_info": {}}
        if os.path.exists(self.memory_file):
            try:
                with open(self.memory_file, 'r', encoding='utf-8') as f:
                    existing_data = json.load(f)
            except (json.JSONDecodeError, OSError) as e:
                print(f"Warning: could not read {self.memory_file} ({e}); "
                      "starting a fresh memory file.")

        question_data = {
            "question_id": task_id or len(existing_data["questions"]) + 1,
            "timestamp": datetime.now().isoformat(),
            "model_provider": self.model_provider,
            "task": question,
            "result": answer,
            "error": error,
            "memory": memory_data,
            "memory_stats": self.get_memory_stats()
        }

        # Update in place when the task_id already exists, append otherwise.
        if task_id:
            for i, existing_question in enumerate(existing_data["questions"]):
                if existing_question["question_id"] == task_id:
                    existing_data["questions"][i] = question_data
                    break
            else:
                existing_data["questions"].append(question_data)
        else:
            existing_data["questions"].append(question_data)

        existing_data["batch_info"] = {
            "total_questions": len(existing_data["questions"]),
            "last_updated": datetime.now().isoformat(),
            "model_provider": self.model_provider
        }

        # default=str stringifies non-serializable objects (e.g. step
        # objects inside the memory dump) instead of raising.
        with open(self.memory_file, 'w', encoding='utf-8') as f:
            json.dump(existing_data,
                      f,
                      indent=2,
                      ensure_ascii=False,
                      default=str)

        print(f"Memory for question {task_id} exported to {self.memory_file}")

    def extract_memory_data(self) -> Dict[str, Any]:
        """Extract the agent's memory (system prompt + per-step data)."""
        memory_data = {"system_prompt": None, "steps": [], "full_steps": []}

        # Get system prompt
        if hasattr(self.agent.memory,
                   'system_prompt') and self.agent.memory.system_prompt:
            memory_data["system_prompt"] = {
                "content": str(self.agent.memory.system_prompt.system_prompt),
                "type": "system_prompt"
            }

        # Summarize each memory step; TaskStep and ActionStep carry
        # different fields, other step types get just the common header.
        for i, step in enumerate(self.agent.memory.steps):
            step_data = {
                "step_index": i,
                "step_type": type(step).__name__,
                "timestamp": datetime.now().isoformat()
            }

            if isinstance(step, TaskStep):
                step_data.update({
                    "task":
                    step.task,
                    "task_images":
                    len(step.task_images) if step.task_images else 0
                })
            elif isinstance(step, ActionStep):
                step_data.update({
                    "step_number":
                    step.step_number,
                    "llm_output":
                    getattr(step, 'action', None),
                    "observations":
                    step.observations,
                    "error":
                    str(step.error) if step.error else None,
                    "has_images":
                    len(step.observations_images) > 0
                    if step.observations_images else False
                })

            memory_data["steps"].append(step_data)

        # Full step dicts as provided by smolagents; best-effort since the
        # API surface differs between versions.
        try:
            memory_data["full_steps"] = self.agent.memory.get_full_steps()
        except Exception as e:
            print(f"Could not get full steps: {e}")
            memory_data["full_steps"] = []

        return memory_data

    def get_memory_stats(self) -> Dict[str, int]:
        """Count step types (task/action) and error vs successful steps."""
        stats = {
            "total_steps": len(self.agent.memory.steps),
            "task_steps": 0,
            "action_steps": 0,
            "error_steps": 0,
            "successful_steps": 0
        }

        for step in self.agent.memory.steps:
            if isinstance(step, TaskStep):
                stats["task_steps"] += 1
            elif isinstance(step, ActionStep):
                stats["action_steps"] += 1
                if step.error:
                    stats["error_steps"] += 1
                else:
                    stats["successful_steps"] += 1

        return stats

    def _download_file(self, file_url: str,
                       file_ext: str = "") -> "str | bytes | None":
        """Download a file, returning text for known text extensions,
        raw bytes otherwise, or None on any download error.

        (Return annotation fixed: the original claimed ``-> str`` but the
        method also returns ``bytes`` and ``None``.)
        """
        try:
            response = requests.get(file_url, timeout=30)
            response.raise_for_status()

            # For text files, return as string
            if file_ext.lower() in [
                    'txt', 'csv', 'json', 'md', 'py', 'js', 'html', 'xml'
            ]:
                return response.text
            else:
                # For binary files, return the content as bytes
                return response.content

        except Exception as e:
            print(f"Error downloading file from {file_url}: {e}")
            return None
app.py CHANGED
@@ -3,175 +3,12 @@ import gradio as gr
3
  import requests
4
  import inspect
5
  import pandas as pd
6
- import sys
7
- import time
8
- from dotenv import load_dotenv
9
- from smolagents import DuckDuckGoSearchTool, OpenAIServerModel, CodeAgent, Tool
10
- from blablador import Models
11
 
12
  # (Keep Constants as is)
13
  # --- Constants ---
14
  DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
15
 
16
- # --- Basic Agent Definition ---
17
- # ----- THIS IS WERE YOU CAN BUILD WHAT YOU WANT ------
18
- load_dotenv()
19
-
20
-
21
- class BasicAgent:
22
-
23
- def __init__(self, model_provider: str = "Blablador"):
24
- self.model_provider = model_provider
25
-
26
- if model_provider == "Blablador":
27
-
28
- models = Models(
29
- api_key=os.getenv("Blablador_API_KEY")).get_model_ids()
30
- model_id_blablador = 5
31
- model_name = " ".join(
32
- models[model_id_blablador].split(" - ")[1].split()[:2])
33
- print("The agent uses the following model:", model_name)
34
-
35
- answer_llm = OpenAIServerModel(
36
- model_id=models[model_id_blablador],
37
- api_base="https://helmholtz-blablador.fz-juelich.de:8000/v1",
38
- api_key=os.getenv("Blablador_API_KEY"),
39
- flatten_messages_as_text=True,
40
- temperature=0.2)
41
-
42
- elif model_provider == "Gemini":
43
-
44
- # model_name = "gemini-2.5-flash-preview-05-20"
45
- model_name = "gemini-2.0-flash"
46
- print("The agent uses the following model:", model_name)
47
-
48
- answer_llm = OpenAIServerModel(
49
- model_id=model_name,
50
- api_base=
51
- "https://generativelanguage.googleapis.com/v1beta/openai/",
52
- api_key=os.getenv("Gemini_API_KEY2"),
53
- temperature=0.2)
54
- else:
55
- print(
56
- f"Error: Unsupported model provider '{model_provider}'. Only 'Blablador' and 'Gemini' are supported."
57
- )
58
- sys.exit(1)
59
-
60
- self.agent = CodeAgent(
61
- tools=[DuckDuckGoSearchTool()],
62
- model=answer_llm,
63
- planning_interval=3,
64
- max_steps=10,
65
- # verbosity_level=LogLevel.ERROR,
66
- )
67
-
68
- def __call__(self,
69
- question: str,
70
- file_url: str = "",
71
- file_ext: str = "") -> str:
72
- print(f"Agent received question (first 50 chars): {question[:50]}...")
73
-
74
- SYSTEM_PROMPT = """You are a general AI assistant. I will ask you a question.
75
- Report your thoughts, and finish your answer with the following template: FINAL ANSWER: [YOUR FINAL ANSWER].
76
- YOUR FINAL ANSWER should be a number OR as few words as possible OR a comma separated list of numbers and/or strings.
77
- If you are asked for a number, don't use comma to write your number
78
- neither use units such as $ or percent sign unless specified otherwise.
79
- If you are asked for a string, don't use articles, neither ABBREVIATIONS, (e.g. for cities),
80
- and write the digits in plain text unless specified otherwise.
81
- If you are asked for a comma separated list,
82
- apply the above rules depending of whether the element to be put in the list is a number or a string.
83
- """
84
-
85
- # Prepare additional_args for file handling
86
- additional_args = {}
87
-
88
- # Handle file if provided
89
- if file_url:
90
- # print(f"Downloading file from: {file_url}")
91
- # file_content = self._download_file(file_url, file_ext)
92
-
93
- # if file_content is not None:
94
- # # Give the file a clear name based on its extension
95
- # if file_ext.lower() == 'csv':
96
- # # For CSV files, try to load as DataFrame
97
- # try:
98
- # import io
99
- # if isinstance(file_content, str):
100
- # df = pd.read_csv(io.StringIO(file_content))
101
- # else:
102
- # df = pd.read_csv(io.BytesIO(file_content))
103
- # additional_args['dataframe'] = df
104
- # additional_args['csv_file'] = file_content
105
- # print(f"Loaded CSV file with shape: {df.shape}")
106
- # except Exception as e:
107
- # print(f"Could not parse CSV file: {e}")
108
- # additional_args['file_content'] = file_content
109
-
110
- # elif file_ext.lower() in ['json']:
111
- # try:
112
- # import json
113
- # if isinstance(file_content, bytes):
114
- # file_content = file_content.decode('utf-8')
115
- # json_data = json.loads(file_content)
116
- # additional_args['json_data'] = json_data
117
- # additional_args['file_content'] = file_content
118
- # print(f"Loaded JSON file")
119
- # except Exception as e:
120
- # print(f"Could not parse JSON file: {e}")
121
- # additional_args['file_content'] = file_content
122
-
123
- # else:
124
- # # For other file types, just pass the content
125
- # additional_args['file_content'] = file_content
126
- # if file_ext:
127
- # additional_args['file_extension'] = file_ext
128
- # print(f"Loaded {file_ext} file")
129
-
130
- # Update the prompt to mention the file
131
- # full_prompt = f"{SYSTEM_PROMPT}\n\nQuestion: {question}\n\nNote: A {file_ext} file has been provided and is available for your analysis."
132
- additional_args = f"{file_url}_{file_ext}"
133
- full_prompt = f"{SYSTEM_PROMPT}\n\nQuestion: {question}\n\nNote: A {file_ext} file has been provided and is available for your analysis."
134
-
135
- # else:
136
- # full_prompt = f"{SYSTEM_PROMPT}\n\nQuestion: {question}\n\nNote: Could not retrieve the file from {file_url}."
137
- else:
138
- full_prompt = f"{SYSTEM_PROMPT}\n\nQuestion: {question}"
139
-
140
- # # Combine system prompt with the user question
141
- # full_prompt = f"{SYSTEM_PROMPT}\n\nQuestion: {question}"
142
-
143
- try:
144
- answer = self.agent.run(full_prompt)
145
- # answer = self.agent.run(
146
- # task=full_prompt,
147
- # additional_args=additional_args if additional_args else None)
148
- print(f"Agent returning answer: {answer}")
149
- if self.model_provider == "Gemini":
150
- time.sleep(10)
151
- return answer
152
- except Exception as e:
153
- print(f"Error running agent: {e}")
154
- return f"Error: {e}"
155
-
156
- def _download_file(self, file_url: str, file_ext: str = "") -> str:
157
- """Download file content from URL and return as text or bytes"""
158
- try:
159
- response = requests.get(file_url, timeout=30)
160
- response.raise_for_status()
161
-
162
- # For text files, return as string
163
- if file_ext.lower() in [
164
- 'txt', 'csv', 'json', 'md', 'py', 'js', 'html', 'xml'
165
- ]:
166
- return response.text
167
- else:
168
- # For binary files, return the content as bytes
169
- return response.content
170
-
171
- except Exception as e:
172
- print(f"Error downloading file from {file_url}: {e}")
173
- return None
174
-
175
 
176
  def run_and_submit_all(profile: gr.OAuthProfile | None):
177
  """
@@ -244,7 +81,7 @@ def run_and_submit_all(profile: gr.OAuthProfile | None):
244
  file_url = f"{api_url}/files/{task_id}"
245
 
246
  try:
247
- submitted_answer = agent(question_text)
248
  # submitted_answer = agent(question_text, file_url, file_ext)
249
  answers_payload.append({
250
  "task_id": task_id,
 
3
  import requests
4
  import inspect
5
  import pandas as pd
6
+ from agent import BasicAgent
 
 
 
 
7
 
8
  # (Keep Constants as is)
9
  # --- Constants ---
10
  DEFAULT_API_URL = "https://agents-course-unit4-scoring.hf.space"
11
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
12
 
13
  def run_and_submit_all(profile: gr.OAuthProfile | None):
14
  """
 
81
  file_url = f"{api_url}/files/{task_id}"
82
 
83
  try:
84
+ submitted_answer = agent(question_text, task_id)
85
  # submitted_answer = agent(question_text, file_url, file_ext)
86
  answers_payload.append({
87
  "task_id": task_id,