{"messages": [{"role": "user", "content": "What is 47 * 89?"}], "tools": [{"name": "calculator", "description": "Evaluate an arithmetic expression.", "parameters": {"type": "object", "properties": {"expression": {"type": "string"}}, "required": ["expression"]}}], "expected": {"name": "calculator", "arguments": {"expression": "47*89"}}, "expected_output": "{\"name\": \"calculator\", \"arguments\": {\"expression\": \"47*89\"}}"}
{"messages": [{"role": "user", "content": "What's the square root of 1764?"}], "tools": [{"name": "calculator", "description": "Evaluate an arithmetic expression.", "parameters": {"type": "object", "properties": {"expression": {"type": "string"}}, "required": ["expression"]}}], "expected": {"name": "calculator", "arguments": {"expression": "sqrt(1764)"}}, "expected_output": "{\"name\": \"calculator\", \"arguments\": {\"expression\": \"sqrt(1764)\"}}"}
{"messages": [{"role": "user", "content": "Who won the 2022 FIFA World Cup?"}], "tools": [{"name": "web_search", "description": "Search the web.", "parameters": {"type": "object", "properties": {"query": {"type": "string"}}, "required": ["query"]}}], "expected": {"name": "web_search", "arguments": {"query": "2022 FIFA World Cup winner"}}, "expected_output": "{\"name\": \"web_search\", \"arguments\": {\"query\": \"2022 FIFA World Cup winner\"}}"}
{"messages": [{"role": "user", "content": "Remember that my flight is on Tuesday."}], "tools": [{"name": "memory", "description": "Persist key/value notes.", "parameters": {"type": "object", "properties": {"action": {"type": "string"}, "key": {"type": "string"}, "value": {"type": "string"}}, "required": ["action"]}}], "expected": {"name": "memory", "arguments": {"action": "remember", "key": "flight", "value": "Tuesday"}}, "expected_output": "{\"name\": \"memory\", \"arguments\": {\"action\": \"remember\", \"key\": \"flight\", \"value\": \"Tuesday\"}}"}
{"messages": [{"role": "user", "content": "Set a 5-minute timer for my tea."}], "tools": [{"name": "timer", "description": "Set timers and stopwatches.", "parameters": {"type": "object", "properties": {"action": {"type": "string"}, "seconds": {"type": "number"}, "label": {"type": "string"}}, "required": ["action"]}}], "expected": {"name": "timer", "arguments": {"action": "set_timer", "seconds": 300, "label": "tea"}}, "expected_output": "{\"name\": \"timer\", \"arguments\": {\"action\": \"set_timer\", \"seconds\": 300, \"label\": \"tea\"}}"}
{"messages": [{"role": "user", "content": "What is 1000 divided by 8?"}], "tools": [{"name": "calculator", "description": "Evaluate an arithmetic expression.", "parameters": {"type": "object", "properties": {"expression": {"type": "string"}}, "required": ["expression"]}}], "expected": {"name": "calculator", "arguments": {"expression": "1000/8"}}, "expected_output": "{\"name\": \"calculator\", \"arguments\": {\"expression\": \"1000/8\"}}"}
{"messages": [{"role": "user", "content": "Search for the tallest mountain in the world."}], "tools": [{"name": "web_search", "description": "Search the web.", "parameters": {"type": "object", "properties": {"query": {"type": "string"}}, "required": ["query"]}}], "expected": {"name": "web_search", "arguments": {"query": "tallest mountain in the world"}}, "expected_output": "{\"name\": \"web_search\", \"arguments\": {\"query\": \"tallest mountain in the world\"}}"}
{"messages": [{"role": "user", "content": "What did I tell you about my flight?"}], "tools": [{"name": "memory", "description": "Persist key/value notes.", "parameters": {"type": "object", "properties": {"action": {"type": "string"}, "key": {"type": "string"}, "value": {"type": "string"}}, "required": ["action"]}}], "expected": {"name": "memory", "arguments": {"action": "recall", "key": "flight"}}, "expected_output": "{\"name\": \"memory\", \"arguments\": {\"action\": \"recall\", \"key\": \"flight\"}}"}
{"messages": [{"role": "user", "content": "How long has it been since I started my workout stopwatch?"}], "tools": [{"name": "timer", "description": "Set timers and stopwatches.", "parameters": {"type": "object", "properties": {"action": {"type": "string"}, "label": {"type": "string"}}, "required": ["action"]}}], "expected": {"name": "timer", "arguments": {"action": "stop_stopwatch", "label": "workout"}}, "expected_output": "{\"name\": \"timer\", \"arguments\": {\"action\": \"stop_stopwatch\", \"label\": \"workout\"}}"}
{"messages": [{"role": "user", "content": "Compute 2 to the power of 16."}], "tools": [{"name": "calculator", "description": "Evaluate an arithmetic expression.", "parameters": {"type": "object", "properties": {"expression": {"type": "string"}}, "required": ["expression"]}}], "expected": {"name": "calculator", "arguments": {"expression": "2^16"}}, "expected_output": "{\"name\": \"calculator\", \"arguments\": {\"expression\": \"2^16\"}}"}