Spaces:
Sleeping
Sleeping
| { | |
| "id": 58, | |
| "subset": "Hand-Crafted", | |
| "mistake_step": 1, | |
| "question": "Your question here - what task is the agent trying to solve?", | |
| "agent": "Primary_Agent_Name", | |
| "agents": [ | |
| "Agent1", | |
| "Agent2", | |
| "Agent3" | |
| ], | |
| "trace": "[\n {\n \"content\": \"System prompt or initial instruction\",\n \"name\": \"System\",\n \"role\": \"system\"\n },\n {\n \"content\": \"User's question or task description\",\n \"name\": \"User\",\n \"role\": \"user\"\n },\n {\n \"content\": \"Agent's response or action\",\n \"name\": \"Agent_Name\",\n \"role\": \"assistant\"\n },\n {\n \"content\": \"Follow-up interaction or error\",\n \"name\": \"Agent_Name\",\n \"role\": \"assistant\"\n }\n]", | |
| "is_correct": false, | |
| "question_id": "84c5fae2-0bad-47f2-87f5-61bd66ab3a84", | |
| "ground_truth": "The correct answer or expected result", | |
| "mistake_agent": "Agent_Name", | |
| "mistake_reason": "Specific reason why the agent failed - be descriptive" | |
| } |