Final_Assignment_Template

Sleeping

App Files Community

ForestRabbit committed on May 6, 2025

Commit

c248959

verified ·

1 Parent(s): 5091518

Update agent.py

Browse files

Files changed (1) hide show

agent.py +28 -52

agent.py CHANGED Viewed

@@ -94,64 +94,40 @@ class Agent:
         type_prefix = f"[Task Type: {task_type.upper()}]\n\n"
         system_prompt = (
-            "You are a member of a multidisciplinary research institute, tackling complex and ambiguous problems across knowledge, reasoning, and vision.\n\n"
-            "You have access to tools like search engines, calculators, and data analysis environments. Your task is to solve the following question carefully and completely.\n\n"
-            "You must:\n"
-            "- Think step by step, and write down all reasoning.\n"
-            "- If information is missing, use what you know and search if needed.\n"
-            "- If you encounter a file, inspect its content and extract relevant information.\n"
-            "- Use available tools only when needed, but do not rely on them blindly.\n"
-            "- If a tool does not return the final answer, analyze the result and continue reasoning.\n\n"
-            "Always:\n"
-            "- Confirm that your answer satisfies the constraints (e.g., format, brevity, units).\n"
-            "- Answer in one English sentence only, with no explanation.\n"
-            "- If the question has a strict required output format, follow it exactly.\n"
-            "- **Examples: JSON key-value, comma-separated lists, IOC country codes, etc.**\n"
-            "- When in doubt, re-read the question and match the required format.\n"
-            "- Do not end your output until you're confident your answer is final and complete.\n\n"
-            "---\n\n"
-            "📌 Advice on Tools and Reasoning:\n"
-            "If the task involves mathematical reasoning or data transformation, consider writing and executing a short Python snippet using the Calculator tool.\n"
-            "Advisory: The problem setter may have intentionally included code or files that appear unreadable or confusing. If that happens, saying \"I cannot read this\" is not the correct answer — \"finding an alternative approach\" is. This may apply to Python, HTML, JSON, SQL, or other formats.\n\n"
-            "If a file is provided:\n"
-            "- For `.csv`, `.tsv`, `.xlsx`: Assume a spreadsheet or table is loaded. Use it to find sums, counts, or specific values. Refer to column names or rows where applicable.\n"
-            "- For `.json`, `.jsonl`: Treat it as structured data. Parse keys, values, or lists. Count or extract as needed.\n"
-            "- For `.doc`, `.docx`: Assume it's a document with paragraphs. Look for keywords, names, or sections.\n"
-            "- For `.pdf`: Treat it as text with pagination. Skim the content summary and extract relevant statements or facts.\n"
-            "Advisory: The problem setter may intentionally leave broken files, folders, or links to increase difficulty. Do not simply return 'unreadable'. Your task is to consider alternative strategies and try to reason around missing content.\n\n"
-            "---\n\n"
-            "Now solve the following task as best as possible. Do not skip steps. Think hard. Use all your skills and tools. Good luck.\n\n"
         )
         file_summary = ""
         try:
-            if file_names:
-                file_path = f"/home/user/app/files/{task_id}/{file_names[0]}"
                 ext = Path(file_path).suffix.lower()
-                if ext in [".csv", ".tsv"]:
-                    df = pd.read_csv(file_path)
-                    file_summary = f"The following table has been loaded with {df.shape[0]} rows and {df.shape[1]} columns:\n{df.head(3).to_string(index=False)}"
-                elif ext == ".xlsx":
-                    df = pd.read_excel(file_path)
-                    file_summary = f"The following spreadsheet has been loaded with {df.shape[0]} rows and {df.shape[1]} columns:\n{df.head(3).to_string(index=False)}"
-                elif ext in [".json", ".jsonl"]:
-                    with open(file_path, "r", encoding="utf-8") as f:
-                        if ext == ".jsonl":
-                            data = [json.loads(line) for line in f if line.strip()]
-                        else:
-                            data = json.load(f)
-                    file_summary = f"The following JSON data was loaded ({len(data)} items)."
-                elif ext == ".docx":
-                    doc = Document(file_path)
-                    text = "\n".join([para.text for para in doc.paragraphs])
-                    file_summary = f"Extracted text from DOCX ({len(text)} characters)."
-                elif ext == ".pdf":
-                    doc = fitz.open(file_path)
-                    text = "".join([page.get_text() for page in doc])
-                    file_summary = f"Extracted text from PDF ({len(doc)} pages, {len(text)} characters)."
-                else:
-                    file_summary = "(Unsupported file type — skipping file content.)"
             full_prompt = type_prefix + system_prompt + file_summary + f"\n\nTASK:\n{question}"
             result = self.agent.run(full_prompt)
             return result.strip()

         type_prefix = f"[Task Type: {task_type.upper()}]\n\n"
         system_prompt = (
+            "You are a member of a multidisciplinary research institute... [truncated for brevity, kept same]"
         )
         file_summary = ""
         try:
+            summaries = []
+            for fname in file_names:
+                file_path = f"/home/user/app/files/{task_id}/{fname}"
                 ext = Path(file_path).suffix.lower()
+                try:
+                    if ext in [".csv", ".tsv"]:
+                        df = pd.read_csv(file_path)
+                        summaries.append(f"Loaded {fname} with {df.shape[0]} rows and {df.shape[1]} columns:\n{df.head(3).to_string(index=False)}")
+                    elif ext == ".xlsx":
+                        df = pd.read_excel(file_path)
+                        summaries.append(f"Loaded {fname} with {df.shape[0]} rows and {df.shape[1]} columns:\n{df.head(3).to_string(index=False)}")
+                    elif ext in [".json", ".jsonl"]:
+                        with open(file_path, "r", encoding="utf-8") as f:
+                            data = [json.loads(line) for line in f if line.strip()] if ext == ".jsonl" else json.load(f)
+                        summaries.append(f"Loaded JSON data from {fname} ({len(data)} entries)")
+                    elif ext == ".docx":
+                        doc = Document(file_path)
+                        text = "\n".join([para.text for para in doc.paragraphs])
+                        summaries.append(f"Extracted text from DOCX {fname} ({len(text)} characters)")
+                    elif ext == ".pdf":
+                        doc = fitz.open(file_path)
+                        text = "".join([page.get_text() for page in doc])
+                        summaries.append(f"Extracted text from PDF {fname} ({len(doc)} pages, {len(text)} characters)")
+                    else:
+                        summaries.append(f"{fname}: Unsupported file type {ext}")
+                except Exception as fe:
+                    summaries.append(f"{fname}: ERROR reading file ({fe})")
+            file_summary = "\n\n".join(summaries)
             full_prompt = type_prefix + system_prompt + file_summary + f"\n\nTASK:\n{question}"
             result = self.agent.run(full_prompt)
             return result.strip()