Spaces:

doxiy
/

exam-agent

Sleeping

doxiy committed on Jun 2, 2025

Commit

c098b65

1 Parent(s): b8de053

version complète v09

Files changed (3) hide show

agent.py CHANGED Viewed

@@ -11,27 +11,13 @@ load_dotenv()
 openai_api_key = os.getenv("OPENAI_API_KEY")
 os.environ["OPENAI_API_KEY"] = openai_api_key
 # 🧠 Création de l'agent
 llm = OpenAI(
     model="gpt-3.5-turbo",
-    system_prompt=("""
-            You are a GAIA benchmark agent.
-            RULES:
-            - Respond ONLY with the final answer.
-            - Do NOT include explanations, reasoning, full sentences, or labels like "Answer:".
-            - If the answer is a number, respond with the number alone.
-            - If the answer is a word or phrase, write it exactly.
-            - Never repeat the question.
-            Examples:
-            "How many albums?" → 4
-            "What surname?" → Smith
-            "Which country?" → France
-                   """
-    ),
     max_tokens=1500,
     temperature=0.1
 )

 openai_api_key = os.getenv("OPENAI_API_KEY")
 os.environ["OPENAI_API_KEY"] = openai_api_key
+with open("prompt.txt", "r", encoding="utf-8") as f:
+    my_prompt = f.read()
 # 🧠 Création de l'agent
 llm = OpenAI(
     model="gpt-3.5-turbo",
+    system_prompt=(my_prompt),
     max_tokens=1500,
     temperature=0.1
 )

prompt.txt ADDED Viewed

+system_prompt = """
+# GAIA Benchmark Agent
+You are an expert research agent for GAIA benchmark questions.
+## MANDATORY WORKFLOW
+1. **ALWAYS use available tools** to research and find information
+2. **NEVER say "I cannot answer"** - always attempt to use tools first
+3. **Use web_search for ALL factual questions** that require current information
+4. **Try multiple search approaches** if the first search doesn't give good results
+## OUTPUT FORMAT RULES
+- Respond with ONLY the final answer
+- No explanations, no reasoning, no "Answer:" labels
+- If number → just the number: `4`
+- If word/name → just the word: `Smith`
+- If list → comma-separated: `a,b,c` (no spaces after commas)
+- If country code → just the code: `USA`
+## Examples
+- Question: "How many albums did X release?" → `4`
+- Question: "What is the surname of Y?" → `Johnson`
+- Question: "List the vegetables:" → `broccoli,celery,lettuce`
+## CRITICAL RULE
+**ALWAYS use tools before responding. NEVER give up without trying.**
+"""

test.py CHANGED Viewed

@@ -16,7 +16,7 @@ except Exception as e:
     print(f"❌ Erreur DuckDuckGo: {e}")
 # Testez avec une question simple
-question_test =  "How many studio albums were published by Mercedes Sosa between 2000 and 2009 , 2009 included?"
 expected_type = detect_answer_type(question_test)
 print(expected_type)

     print(f"❌ Erreur DuckDuckGo: {e}")
 # Testez avec une question simple
+question_test =  "How many studio albums were published by Mercedes Sosa between 2000 and 2009 (included)? You can use the latest 2022 version of english wikipedia."
 expected_type = detect_answer_type(question_test)
 print(expected_type)