Spaces:

gabejavitt
/

agentCourse

Sleeping

App Files Files Community

gabejavitt committed on Oct 29, 2025

Commit

54c602c

verified ·

1 Parent(s): 9cdc007

Update app.py

Browse files

Files changed (1) hide show

app.py +66 -12

app.py CHANGED Viewed

@@ -13,6 +13,9 @@ import re
 import uuid
 import time
 # --- Multimodal & Web Tool Imports ---
 from transformers import pipeline
 from youtube_transcript_api import YouTubeTranscriptApi
@@ -61,7 +64,10 @@ agent = None
 # ====================================================
 # --- Tool Definitions ---
-@tool
 def search_tool(query: str) -> str:
     """Calls DuckDuckGo search and returns the results. Use this for recent information or general web searches."""
     if not isinstance(query, str) or not query.strip():
@@ -78,7 +84,10 @@ def search_tool(query: str) -> str:
         return f"Error running search for '{query}': {str(e)}"
-@tool
 def code_interpreter(code: str) -> str:
     """
     Executes a string of Python code and returns its stdout, stderr, and any error.
@@ -132,7 +141,10 @@ def code_interpreter(code: str) -> str:
         return f"Execution failed:\n{tb_str}"
-@tool
 def read_file(path: str) -> str:
     """Reads the content of a file at the specified path. Use this to examine uploaded files or files you've created."""
     if not isinstance(path, str) or not path.strip():
@@ -186,7 +198,11 @@ def read_file(path: str) -> str:
         return f"Unexpected error accessing file '{path}': {str(e)}"
-@tool
 def write_file(path: str, content: str) -> str:
     """Writes content to a file at the specified path. Creates directories if needed."""
     if not isinstance(path, str) or not path.strip():
@@ -213,7 +229,10 @@ def write_file(path: str, content: str) -> str:
         return f"Error writing file '{path}': {str(e)}"
-@tool
 def list_directory(path: str = ".") -> str:
     """Lists the contents of a directory. Useful for finding available files."""
     if not isinstance(path, str):
@@ -254,7 +273,10 @@ def list_directory(path: str = ".") -> str:
         return f"Error listing directory '{path}': {str(e)}"
-@tool
 def audio_transcription_tool(file_path: str) -> str:
     """Transcribes an audio file (mp3, wav, etc.) to text using Whisper."""
     if not isinstance(file_path, str) or not file_path.strip():
@@ -300,7 +322,10 @@ def audio_transcription_tool(file_path: str) -> str:
         return f"Error transcribing '{file_path}': {str(e)}"
-@tool
 def get_youtube_transcript(video_url: str) -> str:
     """Fetches the transcript/captions for a YouTube video."""
     if not isinstance(video_url, str) or not video_url.strip():
@@ -335,7 +360,11 @@ def get_youtube_transcript(video_url: str) -> str:
 # --- NEW RAG-BASED SCRAPER TOOL ---
-@tool
 def scrape_and_retrieve(url: str, query: str) -> str:
     """
     Scrapes a webpage, chunks its content, and performs a RAG (Retrieval-Augmented Generation)
@@ -401,7 +430,10 @@ def scrape_and_retrieve(url: str, query: str) -> str:
         return f"Error scraping or retrieving from {url}: {str(e)}\n{tb_str}"
-@tool
 def final_answer_tool(answer: str) -> str:
     """
     Call this tool ONLY when you have the final, definitive answer.
@@ -500,7 +532,17 @@ class BasicAgent:
         # Build tool descriptions
         tool_desc_list = []
         for tool in self.tools:
-            desc = f"- {tool.name}: {tool.description}"
             tool_desc_list.append(desc)
         tool_descriptions = "\n".join(tool_desc_list)
@@ -656,6 +698,10 @@ Current Chat History:
                         )
                     time.sleep(2 ** attempt)
             if ai_message.tool_calls:
                  print(f"🔧 Executor Tool Call: {ai_message.tool_calls[0]['name']}")
             else:
@@ -775,6 +821,11 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main" if space_id else "local_run"
     print(f"Agent code URL: {agent_code}")
     print("--- USING MOCK QUESTIONS ---")
     mock_questions_data = [
         {
             "task_id": "mock_level1_001",
@@ -857,6 +908,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
             "question": r"""As of August 2023, how many in-text citations on the West African Vodun Wikipedia page reference a source that was cited using Scopus?"""
         }
     ]
     questions_data = mock_questions_data
     print(f"Using {len(questions_data)} mock questions.")
@@ -891,7 +943,7 @@ def run_and_submit_all( profile: gr.OAuthProfile | None):
     status_update = f"Finished mock run. Processed {len(answers_payload)} answers for '{username}'."
     print(status_update); print("--- MOCK RUN - SUBMISSION SKIPPED ---")
-    final_status = "--- MOCK RUN COMPLETE ---\n" + status_update + "\nSubmission SKIPPED."
     results_df = pd.DataFrame(results_log); results_df['Correct'] = 'N/A (Mock)'
     return final_status, results_df
@@ -911,7 +963,7 @@ with gr.Blocks() as demo:
 if __name__ == "__main__":
     print("\n" + "-"*30 + " App Starting " + "-"*30)
-    space_host_startup = os.getenv("SPACE_HOST"); space_id_startup = os.getenv("SPACE_ID")
     if space_host_startup: print(f"✅ SPACE_HOST: {space_host_startup}\n   Runtime URL: https://{space_host_startup}.hf.space")
     else: print("ℹ️ No SPACE_HOST (local?).")
     if space_id_startup: print(f"✅ SPACE_ID: {space_id_startup}\n   Repo URL: https://huggingface.co/spaces/{space_id_startup}\n   Tree URL: https://huggingface.co/spaces/{space_id_startup}/tree/main")
@@ -925,3 +977,5 @@ if __name__ == "__main__":
     print("-"*(60 + len(" App Starting ")) + "\n")
     print("Launching Gradio Interface...")
     demo.queue().launch(debug=True, share=False)

 import uuid
 import time
+# --- Pydantic Import ---
+from pydantic import BaseModel, Field
 # --- Multimodal & Web Tool Imports ---
 from transformers import pipeline
 from youtube_transcript_api import YouTubeTranscriptApi
 # ====================================================
 # --- Tool Definitions ---
+class SearchInput(BaseModel):
+    query: str = Field(description="The search query.")
+@tool(args_schema=SearchInput)
 def search_tool(query: str) -> str:
     """Calls DuckDuckGo search and returns the results. Use this for recent information or general web searches."""
     if not isinstance(query, str) or not query.strip():
         return f"Error running search for '{query}': {str(e)}"
+class CodeInput(BaseModel):
+    code: str = Field(description="The Python code to execute, which must include a print() statement for output.")
+@tool(args_schema=CodeInput)
 def code_interpreter(code: str) -> str:
     """
     Executes a string of Python code and returns its stdout, stderr, and any error.
         return f"Execution failed:\n{tb_str}"
+class ReadFileInput(BaseModel):
+    path: str = Field(description="The path to the file to read.")
+@tool(args_schema=ReadFileInput)
 def read_file(path: str) -> str:
     """Reads the content of a file at the specified path. Use this to examine uploaded files or files you've created."""
     if not isinstance(path, str) or not path.strip():
         return f"Unexpected error accessing file '{path}': {str(e)}"
+class WriteFileInput(BaseModel):
+    path: str = Field(description="The path of the file to write to.")
+    content: str = Field(description="The content to write into the file.")
+@tool(args_schema=WriteFileInput)
 def write_file(path: str, content: str) -> str:
     """Writes content to a file at the specified path. Creates directories if needed."""
     if not isinstance(path, str) or not path.strip():
         return f"Error writing file '{path}': {str(e)}"
+class ListDirInput(BaseModel):
+    path: str = Field(description="The directory path to list.", default=".")
+@tool(args_schema=ListDirInput)
 def list_directory(path: str = ".") -> str:
     """Lists the contents of a directory. Useful for finding available files."""
     if not isinstance(path, str):
         return f"Error listing directory '{path}': {str(e)}"
+class AudioInput(BaseModel):
+    file_path: str = Field(description="The file path of the audio to transcribe.")
+@tool(args_schema=AudioInput)
 def audio_transcription_tool(file_path: str) -> str:
     """Transcribes an audio file (mp3, wav, etc.) to text using Whisper."""
     if not isinstance(file_path, str) or not file_path.strip():
         return f"Error transcribing '{file_path}': {str(e)}"
+class YoutubeInput(BaseModel):
+    video_url: str = Field(description="The URL of the YouTube video.")
+@tool(args_schema=YoutubeInput)
 def get_youtube_transcript(video_url: str) -> str:
     """Fetches the transcript/captions for a YouTube video."""
     if not isinstance(video_url, str) or not video_url.strip():
 # --- NEW RAG-BASED SCRAPER TOOL ---
+class ScrapeInput(BaseModel):
+    url: str = Field(description="The URL to scrape (must start with http:// or https://).")
+    query: str = Field(description="The specific question to answer or information to find on the page.")
+@tool(args_schema=ScrapeInput)
 def scrape_and_retrieve(url: str, query: str) -> str:
     """
     Scrapes a webpage, chunks its content, and performs a RAG (Retrieval-Augmented Generation)
         return f"Error scraping or retrieving from {url}: {str(e)}\n{tb_str}"
+class FinalAnswerInput(BaseModel):
+    answer: str = Field(description="The final, definitive answer to the question.")
+@tool(args_schema=FinalAnswerInput)
 def final_answer_tool(answer: str) -> str:
     """
     Call this tool ONLY when you have the final, definitive answer.
         # Build tool descriptions
         tool_desc_list = []
         for tool in self.tools:
+            # Use Pydantic schema if available for richer descriptions
+            if tool.args_schema:
+                schema = tool.args_schema.schema()
+                args_desc = []
+                for prop, details in schema.get('properties', {}).items():
+                    desc = details.get('description', '')
+                    args_desc.append(f"  - {prop}: {desc}")
+                args_str = "\n".join(args_desc)
+                desc = f"- {tool.name}:\n  {tool.description}\n  Args:\n{args_str}"
+            else:
+                desc = f"- {tool.name}: {tool.description}"
             tool_desc_list.append(desc)
         tool_descriptions = "\n".join(tool_desc_list)
                         )
                     time.sleep(2 ** attempt)
+            # +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
+            # --- FALLBACK LOGIC REMOVED AS REQUESTED ---
+            # +++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++
             if ai_message.tool_calls:
                  print(f"🔧 Executor Tool Call: {ai_message.tool_calls[0]['name']}")
             else:
     agent_code = f"https://huggingface.co/spaces/{space_id}/tree/main" if space_id else "local_run"
     print(f"Agent code URL: {agent_code}")
     print("--- USING MOCK QUESTIONS ---")
+    # --- MOCK QUESTIONS ---
+    #
+    # vvv  PASTE YOUR FULL LIST OF 20 MOCK QUESTIONS HERE  vvv
+    #
     mock_questions_data = [
         {
             "task_id": "mock_level1_001",
             "question": r"""As of August 2023, how many in-text citations on the West African Vodun Wikipedia page reference a source that was cited using Scopus?"""
         }
     ]
     questions_data = mock_questions_data
     print(f"Using {len(questions_data)} mock questions.")
     status_update = f"Finished mock run. Processed {len(answers_payload)} answers for '{username}'."
     print(status_update); print("--- MOCK RUN - SUBMISSION SKIPPED ---")
+    final_.status = "--- MOCK RUN COMPLETE ---\n" + status_update + "\nSubmission SKIPPED."
     results_df = pd.DataFrame(results_log); results_df['Correct'] = 'N/A (Mock)'
     return final_status, results_df
 if __name__ == "__main__":
     print("\n" + "-"*30 + " App Starting " + "-"*30)
+    space_host_startup = os.getenv("SPACE_ID"); space_id_startup = os.getenv("SPACE_ID")
     if space_host_startup: print(f"✅ SPACE_HOST: {space_host_startup}\n   Runtime URL: https://{space_host_startup}.hf.space")
     else: print("ℹ️ No SPACE_HOST (local?).")
     if space_id_startup: print(f"✅ SPACE_ID: {space_id_startup}\n   Repo URL: https://huggingface.co/spaces/{space_id_startup}\n   Tree URL: https://huggingface.co/spaces/{space_id_startup}/tree/main")
     print("-"*(60 + len(" App Starting ")) + "\n")
     print("Launching Gradio Interface...")
     demo.queue().launch(debug=True, share=False)