Spaces:
Sleeping
Sleeping
neznib
committed on
Commit
·
8dffb1d
1
Parent(s):
5f67055
test run
Browse files
app.py
CHANGED
|
@@ -24,7 +24,20 @@ class BasicAgent:
|
|
| 24 |
# fixed_answer = r'{"task_id": "task_id_1", "model_answer": "Between 2000 and 2009 (inclusive), Mercedes Sosa published three studio albums: Corazón Libre (2005), Cantora 1 (2009), and Cantora 2 (2009).", "reasoning_trace": "The different steps by which your model reached answer 1"}{"task_id": "task_id_2", "model_answer": "Answer 2 from your model", "reasoning_trace": "The different steps by which your model reached answer 2"}'
|
| 25 |
#fixed_answer = "I need to find how many studio albums Mercedes Sosa published between 2000 and 2009, inclusive. From the provided list: 2005: Corazón Libre, 2009: Cantora 1 and 2009: Cantora 2. There are three albums within the specified range. FINAL ANSWER: 3"
|
| 26 |
#print(f"Agent returning fixed answer: {fixed_answer}")
|
| 27 |
-
fixed_answer = self.model.invoke([("system", "You are
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 28 |
|
| 29 |
return fixed_answer.content
|
| 30 |
|
|
|
|
| 24 |
# fixed_answer = r'{"task_id": "task_id_1", "model_answer": "Between 2000 and 2009 (inclusive), Mercedes Sosa published three studio albums: Corazón Libre (2005), Cantora 1 (2009), and Cantora 2 (2009).", "reasoning_trace": "The different steps by which your model reached answer 1"}{"task_id": "task_id_2", "model_answer": "Answer 2 from your model", "reasoning_trace": "The different steps by which your model reached answer 2"}'
|
| 25 |
#fixed_answer = "I need to find how many studio albums Mercedes Sosa published between 2000 and 2009, inclusive. From the provided list: 2005: Corazón Libre, 2009: Cantora 1 and 2009: Cantora 2. There are three albums within the specified range. FINAL ANSWER: 3"
|
| 26 |
#print(f"Agent returning fixed answer: {fixed_answer}")
|
| 27 |
+
fixed_answer = self.model.invoke([("system", """You are tasked with answering questions from the GAIA benchmark for AI agents.
|
| 28 |
+
|
| 29 |
+
Provide ONLY the precise answer to the question. Do not include explanations, reasoning, or any additional text. Be direct, specific, and concise to meet the strict exact-matching requirements of the GAIA benchmark.
|
| 30 |
+
|
| 31 |
+
# Output Format
|
| 32 |
+
|
| 33 |
+
- **Single-word or short-phrase answers:** If the question necessitates a brief answer, provide just that word or phrase.
|
| 34 |
+
- **Numerical values:** Provide only the number when applicable, with no additional formatting or units unless specifically requested.
|
| 35 |
+
- **Full sentences:** If the question expects a sentence, provide the exact sentence required with no extra characters, punctuation, or formatting.
|
| 36 |
+
|
| 37 |
+
# Notes
|
| 38 |
+
|
| 39 |
+
- Be aware of strict exact-matching requirements; even minor deviations can result in an incorrect response.
|
| 40 |
+
- If any ambiguity exists in the phrasing of the input, respond with an answer that aligns with the GAIA benchmark's intended interpretation."""), ("user", question)])
|
| 41 |
|
| 42 |
return fixed_answer.content
|
| 43 |
|