Spaces:
Sleeping
Sleeping
Update agent.py
Browse files
agent.py
CHANGED
|
@@ -142,7 +142,7 @@ class BasicAgent:
|
|
| 142 |
model=model,
|
| 143 |
tools=tools,
|
| 144 |
add_base_tools=False,
|
| 145 |
-
max_steps=
|
| 146 |
)
|
| 147 |
self.agent.system_prompt = (
|
| 148 |
"""
|
|
@@ -186,20 +186,4 @@ class BasicAgent:
|
|
| 186 |
|
| 187 |
return final_str
|
| 188 |
|
| 189 |
-
def evaluate_random_questions(self, csv_path: str = "gaia_qa.csv", sample_size: int = 3):
|
| 190 |
-
df = pd.read_csv(csv_path)
|
| 191 |
-
if not {"question", "answer"}.issubset(df.columns):
|
| 192 |
-
print("CSV must contain 'question' and 'answer' columns.")
|
| 193 |
-
print("Found columns:", df.columns.tolist())
|
| 194 |
-
return
|
| 195 |
-
samples = df.sample(n=sample_size)
|
| 196 |
-
for _, row in samples.iterrows():
|
| 197 |
-
question = row["question"].strip()
|
| 198 |
-
expected = f"FINAL ANSWER: {str(row['answer']).strip()}"
|
| 199 |
-
result = self(question).strip()
|
| 200 |
-
print("---")
|
| 201 |
-
print("Question:", question)
|
| 202 |
-
print("Expected:", expected)
|
| 203 |
-
print("Agent:", result)
|
| 204 |
-
print("Correct:", expected == result)
|
| 205 |
|
|
|
|
| 142 |
model=model,
|
| 143 |
tools=tools,
|
| 144 |
add_base_tools=False,
|
| 145 |
+
max_steps=10,
|
| 146 |
)
|
| 147 |
self.agent.system_prompt = (
|
| 148 |
"""
|
|
|
|
| 186 |
|
| 187 |
return final_str
|
| 188 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 189 |
|