Spaces:

peijun1
/

AIstudioProxyAPI

Paused

App Files Files Community

AIstudioProxyAPI / tests /api_utils /test_utils_tool_execution.py

peijun1

Deploy AI Studio Proxy API to Hugging Face Spaces

a5784e9 18 days ago

Raw

History Blame Contribute Delete

15.7 kB

	"""
	High-quality tests for api_utils/utils.py - Tool execution safety (zero mocking of core logic).

	Focus: Test maybe_execute_tools with emphasis on async safety and edge cases.
	Strategy: Mock only external boundaries (execute_tool_call, register_runtime_tools).
	"""

	import asyncio
	from typing import List, cast
	from unittest.mock import AsyncMock, patch

	import pytest

	from models import Message, MessageContentItem


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_cancelled_error_reraised():
	    """
	    Cancellation raised by the tool call must propagate to the caller.

	    Scenario: the patched execute_tool_call raises asyncio.CancelledError.
	    Expected: maybe_execute_tools lets that CancelledError escape rather than
	    swallowing it. Marked CRITICAL by the suite: a swallowed cancellation is
	    what would cause a request to hang.
	    """
	    from api_utils.utils import maybe_execute_tools

	    conversation = [Message(role="user", content="test")]
	    available_tools = [{"function": {"name": "test_tool"}}]
	    forced_choice = {"type": "function", "function": {"name": "test_tool"}}

	    # Both names are patched on the module that uses them, not where they
	    # are originally defined.
	    with (
	        patch(
	            "api_utils.utils_ext.tools_execution.execute_tool_call",
	            new_callable=AsyncMock,
	        ) as exec_mock,
	        patch("api_utils.utils_ext.tools_execution.register_runtime_tools"),
	    ):
	        exec_mock.side_effect = asyncio.CancelledError()

	        # The cancellation has to surface here unchanged.
	        with pytest.raises(asyncio.CancelledError):
	            await maybe_execute_tools(conversation, available_tools, forced_choice)


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_tool_choice_dict_format():
	    """
	    A dict-shaped tool_choice selects the function it names.

	    Scenario: tool_choice is {"type": "function", "function": {"name": "foo"}}-style.
	    Expected: the function name is read from the dict, the tool is executed
	    exactly once, and one result record (name / arguments / result) comes back.
	    """
	    from api_utils.utils import maybe_execute_tools

	    raw_arguments = '{"arg": "value"}'
	    tool_output = '{"result": "success"}'

	    conversation = [Message(role="user", content=raw_arguments)]
	    available_tools = [{"function": {"name": "my_function"}}]
	    forced_choice = {"type": "function", "function": {"name": "my_function"}}

	    exec_patch = patch(
	        "api_utils.utils_ext.tools_execution.execute_tool_call",
	        new_callable=AsyncMock,
	    )
	    register_patch = patch("api_utils.utils_ext.tools_execution.register_runtime_tools")

	    with exec_patch as exec_mock, register_patch:
	        exec_mock.return_value = tool_output
	        outcome = await maybe_execute_tools(conversation, available_tools, forced_choice)

	    # The executor must have received the chosen name and the user's JSON.
	    exec_mock.assert_called_once_with("my_function", raw_arguments)

	    assert outcome is not None
	    assert len(outcome) == 1
	    assert outcome[0]["name"] == "my_function"
	    assert outcome[0]["arguments"] == raw_arguments
	    assert outcome[0]["result"] == tool_output


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_tool_choice_string_none():
	    """
	    String tool_choice values that disable tools (case-insensitive).

	    Scenario: tool_choice is one of "none" / "no" / "off" in various casings.
	    Expected: maybe_execute_tools returns None and the tool is never executed.

	    execute_tool_call is patched so that non-execution is asserted directly.
	    Checking only for a None result is not enough: this suite also expects
	    None when the tool call raises
	    (see test_maybe_execute_tools_base_exception_returns_none), so an
	    unpatched executor that ran and failed would look identical.
	    """
	    from api_utils.utils import maybe_execute_tools

	    messages = [Message(role="user", content="test")]
	    tools = [{"function": {"name": "test_tool"}}]

	    with (
	        patch(
	            "api_utils.utils_ext.tools_execution.execute_tool_call",
	            new_callable=AsyncMock,
	        ) as mock_exec,
	        patch("api_utils.utils_ext.tools_execution.register_runtime_tools"),
	    ):
	        for choice in ["none", "None", "NONE", "no", "NO", "off", "OFF"]:
	            result = await maybe_execute_tools(messages, tools, choice)

	            assert result is None, f"tool_choice={choice!r} should disable tools"
	            # Checked per iteration so a failure names the offending value.
	            mock_exec.assert_not_called()


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_tool_choice_auto_single_tool():
	    """
	    With a single declared tool, the automatic modes pick that tool.

	    Scenario: tool_choice is "auto", "required" or "any" and exactly one tool
	    is supplied.
	    Expected: that tool is executed with the JSON from the user message.
	    """
	    from api_utils.utils import maybe_execute_tools

	    conversation = [Message(role="user", content='{"x": 1}')]
	    available_tools = [{"function": {"name": "only_tool"}}]

	    exec_patch = patch(
	        "api_utils.utils_ext.tools_execution.execute_tool_call",
	        new_callable=AsyncMock,
	    )
	    register_patch = patch("api_utils.utils_ext.tools_execution.register_runtime_tools")

	    with exec_patch as exec_mock, register_patch:
	        exec_mock.return_value = '{"done": true}'

	        for mode in ("auto", "required", "any"):
	            outcome = await maybe_execute_tools(conversation, available_tools, mode)

	            assert outcome is not None
	            assert outcome[0]["name"] == "only_tool"
	            exec_mock.assert_called_with("only_tool", '{"x": 1}')

	            # Clear recorded calls so the next mode is checked in isolation.
	            exec_mock.reset_mock()


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_tool_choice_auto_multiple_tools():
	    """
	    "auto" with several tools cannot pick one automatically.

	    Scenario: tool_choice is "auto" and two tools are declared.
	    Expected: maybe_execute_tools returns None and no tool is executed.

	    execute_tool_call is patched so that "no tool executed" is verified
	    explicitly. A None result alone would also be produced by a tool call
	    that ran and raised
	    (see test_maybe_execute_tools_base_exception_returns_none).
	    """
	    from api_utils.utils import maybe_execute_tools

	    messages = [Message(role="user", content="test")]
	    tools = [
	        {"function": {"name": "tool1"}},
	        {"function": {"name": "tool2"}},
	    ]

	    with (
	        patch(
	            "api_utils.utils_ext.tools_execution.execute_tool_call",
	            new_callable=AsyncMock,
	        ) as mock_exec,
	        patch("api_utils.utils_ext.tools_execution.register_runtime_tools"),
	    ):
	        result = await maybe_execute_tools(messages, tools, "auto")

	    assert result is None
	    mock_exec.assert_not_called()


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_tool_choice_direct_name():
	    """
	    A bare function name passed as tool_choice selects that function.

	    Scenario: tool_choice is the plain string "direct_call".
	    Expected: that function is executed once with the JSON from the user message.
	    """
	    from api_utils.utils import maybe_execute_tools

	    payload = '{"param": 123}'
	    conversation = [Message(role="user", content=payload)]
	    available_tools = [{"function": {"name": "direct_call"}}]

	    exec_patch = patch(
	        "api_utils.utils_ext.tools_execution.execute_tool_call",
	        new_callable=AsyncMock,
	    )
	    register_patch = patch("api_utils.utils_ext.tools_execution.register_runtime_tools")

	    with exec_patch as exec_mock, register_patch:
	        exec_mock.return_value = '{"status": "ok"}'
	        outcome = await maybe_execute_tools(conversation, available_tools, "direct_call")

	    assert outcome is not None
	    assert outcome[0]["name"] == "direct_call"
	    exec_mock.assert_called_once_with("direct_call", payload)


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_tool_choice_none():
	    """
	    A missing tool_choice means tools are not executed proactively.

	    Scenario: tool_choice is None.
	    Expected: maybe_execute_tools returns None and no tool is executed.

	    execute_tool_call is patched so non-execution is asserted directly rather
	    than inferred from the None result, which this suite also expects when a
	    tool call raises (see test_maybe_execute_tools_base_exception_returns_none).
	    """
	    from api_utils.utils import maybe_execute_tools

	    messages = [Message(role="user", content="test")]
	    tools = [{"function": {"name": "test_tool"}}]

	    with (
	        patch(
	            "api_utils.utils_ext.tools_execution.execute_tool_call",
	            new_callable=AsyncMock,
	        ) as mock_exec,
	        patch("api_utils.utils_ext.tools_execution.register_runtime_tools"),
	    ):
	        result = await maybe_execute_tools(messages, tools, None)

	    assert result is None
	    mock_exec.assert_not_called()


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_arguments_from_user_text():
	    """
	    Tool arguments come from JSON embedded in the most recent user message.

	    Scenario: the conversation has system, user, assistant and a final user
	    message whose text contains a JSON object after some prose.
	    Expected: only that JSON object (from the last user message) is passed to
	    the tool and echoed back in the result's "arguments".
	    """
	    from api_utils.utils import maybe_execute_tools

	    expected_arguments = '{"key": "value", "num": 42}'

	    conversation = [
	        Message(role="system", content="System message"),
	        Message(role="user", content="First user message"),
	        Message(role="assistant", content="Response"),
	        Message(
	            role="user",
	            content='Call function with params: {"key": "value", "num": 42}',
	        ),
	    ]
	    available_tools = [{"function": {"name": "test_func"}}]

	    exec_patch = patch(
	        "api_utils.utils_ext.tools_execution.execute_tool_call",
	        new_callable=AsyncMock,
	    )
	    register_patch = patch("api_utils.utils_ext.tools_execution.register_runtime_tools")

	    with exec_patch as exec_mock, register_patch:
	        exec_mock.return_value = "ok"
	        outcome = await maybe_execute_tools(conversation, available_tools, "test_func")

	    # The leading prose must be stripped; only the JSON object is forwarded.
	    exec_mock.assert_called_once_with("test_func", expected_arguments)
	    assert outcome is not None
	    assert outcome[0]["arguments"] == expected_arguments


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_arguments_fallback_empty():
	    """
	    Without any JSON in the user message the arguments default to "{}".

	    Scenario: the only user message is plain text.
	    Expected: the tool is called with the empty-object string "{}" and the
	    result record reports the same arguments.
	    """
	    from api_utils.utils import maybe_execute_tools

	    empty_arguments = "{}"

	    conversation = [Message(role="user", content="No JSON here, just plain text")]
	    available_tools = [{"function": {"name": "my_tool"}}]

	    exec_patch = patch(
	        "api_utils.utils_ext.tools_execution.execute_tool_call",
	        new_callable=AsyncMock,
	    )
	    register_patch = patch("api_utils.utils_ext.tools_execution.register_runtime_tools")

	    with exec_patch as exec_mock, register_patch:
	        exec_mock.return_value = "done"
	        outcome = await maybe_execute_tools(conversation, available_tools, "my_tool")

	    exec_mock.assert_called_once_with("my_tool", empty_arguments)
	    assert outcome is not None
	    assert outcome[0]["arguments"] == empty_arguments


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_existing_tool_result_skip():
	    """
	    A conversation that already contains a tool result is not re-executed.

	    Scenario: the message list includes a role='tool' message.
	    Expected: maybe_execute_tools returns None and does not run the tool
	    again (it follows the conversational call loop instead).

	    execute_tool_call is patched so the "no further execution" claim is
	    verified directly. A None result on its own would also be produced by a
	    tool call that ran and raised
	    (see test_maybe_execute_tools_base_exception_returns_none).
	    """
	    from api_utils.utils import maybe_execute_tools

	    messages = [
	        Message(role="user", content='{"x": 1}'),
	        Message(role="assistant", content="Let me call the tool"),
	        # A tool result is already present in the history.
	        Message(role="tool", content='{"result": "previous call"}'),
	    ]
	    tools = [{"function": {"name": "my_tool"}}]
	    tool_choice = "my_tool"

	    with (
	        patch(
	            "api_utils.utils_ext.tools_execution.execute_tool_call",
	            new_callable=AsyncMock,
	        ) as mock_exec,
	        patch("api_utils.utils_ext.tools_execution.register_runtime_tools"),
	    ):
	        result = await maybe_execute_tools(messages, tools, tool_choice)

	    # Nothing is returned and nothing was executed.
	    assert result is None
	    mock_exec.assert_not_called()


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_base_exception_returns_none():
	    """
	    An ordinary exception from the tool call is caught and reported as None.

	    Scenario: execute_tool_call raises ValueError (i.e. not CancelledError).
	    Expected: maybe_execute_tools catches it and returns None.

	    The test also asserts that the failing tool was actually invoked. None is
	    likewise the expected result when no tool is executed at all, so without
	    that check the test would pass even if the error path were never reached.
	    """
	    from api_utils.utils import maybe_execute_tools

	    messages = [Message(role="user", content='{"arg": "val"}')]
	    tools = [{"function": {"name": "failing_tool"}}]
	    tool_choice = "failing_tool"

	    with (
	        patch(
	            "api_utils.utils_ext.tools_execution.execute_tool_call",
	            new_callable=AsyncMock,
	        ) as mock_exec,
	        patch("api_utils.utils_ext.tools_execution.register_runtime_tools"),
	    ):
	        # Simulate a regular runtime failure inside the tool.
	        mock_exec.side_effect = ValueError("Something went wrong")

	        result = await maybe_execute_tools(messages, tools, tool_choice)

	    # The exception was swallowed ...
	    assert result is None
	    # ... and it really came from the tool call being made.
	    mock_exec.assert_called_once_with("failing_tool", '{"arg": "val"}')


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_register_runtime_tools_called():
	    """
	    maybe_execute_tools registers the supplied tools before executing.

	    Scenario: two tools are declared and one is chosen by name.
	    Expected: register_runtime_tools is called exactly once with the tool
	    list and None as its second argument (the suite treats None as the
	    default MCP endpoint).
	    """
	    from api_utils.utils import maybe_execute_tools

	    conversation = [Message(role="user", content="test")]
	    available_tools = [{"function": {"name": "tool1"}}, {"function": {"name": "tool2"}}]

	    exec_patch = patch(
	        "api_utils.utils_ext.tools_execution.execute_tool_call",
	        new_callable=AsyncMock,
	    )
	    register_patch = patch("api_utils.utils_ext.tools_execution.register_runtime_tools")

	    with exec_patch as exec_mock, register_patch as register_mock:
	        exec_mock.return_value = "ok"
	        await maybe_execute_tools(conversation, available_tools, "tool1")

	    register_mock.assert_called_once_with(available_tools, None)


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_empty_messages():
	    """
	    An empty conversation still executes the chosen tool, with "{}" arguments.

	    Scenario: the message list is empty, so there is no user text to mine.
	    Expected: the tool is called once with the fallback argument string "{}".
	    """
	    from api_utils.utils import maybe_execute_tools

	    conversation = []
	    available_tools = [{"function": {"name": "test_tool"}}]

	    exec_patch = patch(
	        "api_utils.utils_ext.tools_execution.execute_tool_call",
	        new_callable=AsyncMock,
	    )
	    register_patch = patch("api_utils.utils_ext.tools_execution.register_runtime_tools")

	    with exec_patch as exec_mock, register_patch:
	        exec_mock.return_value = "done"
	        await maybe_execute_tools(conversation, available_tools, "test_tool")

	    # No user text available, so the arguments are the empty JSON object.
	    exec_mock.assert_called_once_with("test_tool", "{}")


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_no_chosen_name():
	    """
	    A dict tool_choice that yields no function name results in no execution.

	    Scenario: tool_choice is an empty dict, or a dict whose "function" entry
	    has no "name".
	    Expected: maybe_execute_tools returns None in both cases and never
	    executes a tool.

	    execute_tool_call is patched so non-execution is asserted directly. A
	    None result alone would also be produced by a tool call that ran and
	    raised (see test_maybe_execute_tools_base_exception_returns_none).
	    """
	    from api_utils.utils import maybe_execute_tools

	    messages = [Message(role="user", content="test")]
	    tools = [{"function": {"name": "test_tool"}}]

	    with (
	        patch(
	            "api_utils.utils_ext.tools_execution.execute_tool_call",
	            new_callable=AsyncMock,
	        ) as mock_exec,
	        patch("api_utils.utils_ext.tools_execution.register_runtime_tools"),
	    ):
	        # Empty dict: there is no function.name to read.
	        result1 = await maybe_execute_tools(messages, tools, {})
	        assert result1 is None

	        # "function" entry present, but its "name" is missing.
	        result2 = await maybe_execute_tools(
	            messages, tools, {"type": "function", "function": {}}
	        )
	        assert result2 is None

	    mock_exec.assert_not_called()


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_multiline_json_extraction():
	    """
	    JSON spread over several lines of the user message is extracted whole.

	    Scenario: the user message wraps a multi-line, nested JSON object in prose.
	    Expected: the argument string handed to the tool parses as JSON and
	    contains both the top-level and the nested values.

	    The call is asserted before its arguments are inspected, so a missing
	    call fails with a clear assertion message instead of a TypeError from
	    indexing call_args when it is None.
	    """
	    import json

	    from api_utils.utils import maybe_execute_tools

	    messages = [
	        Message(
	            role="user",
	            content="""Please call the function with:
	{
	"param1": "value1",
	"param2": "value2",
	"nested": {
	"key": "val"
	}
	}
	Thank you!""",
	        )
	    ]
	    tools = [{"function": {"name": "multi_tool"}}]
	    tool_choice = "multi_tool"

	    with (
	        patch(
	            "api_utils.utils_ext.tools_execution.execute_tool_call",
	            new_callable=AsyncMock,
	        ) as mock_exec,
	        patch("api_utils.utils_ext.tools_execution.register_runtime_tools"),
	    ):
	        mock_exec.return_value = "ok"

	        await maybe_execute_tools(messages, tools, tool_choice)

	    # Guard: the tool must have been invoked exactly once before we look at
	    # what it was invoked with.
	    mock_exec.assert_called_once()

	    # Second positional argument is the extracted argument string.
	    called_args = mock_exec.call_args[0][1]

	    # Compare parsed values rather than raw text, so whitespace inside the
	    # extracted JSON does not matter.
	    parsed = json.loads(called_args)
	    assert parsed["param1"] == "value1"
	    assert parsed["nested"]["key"] == "val"


	@pytest.mark.asyncio
	async def test_maybe_execute_tools_list_content_extraction():
	    """
	    JSON is extracted from the text parts of list-style message content.

	    Scenario: the user message content is a list mixing two text items with
	    an image_url item; the second text item is a JSON object.
	    Expected: the tool receives exactly that JSON object as its arguments.
	    """
	    from api_utils.utils import maybe_execute_tools

	    content_parts = [
	        {"type": "text", "text": "Before image"},
	        {
	            "type": "image_url",
	            "image_url": {"url": "http://example.com/img.jpg"},
	        },
	        {"type": "text", "text": '{"action": "process_image"}'},
	    ]
	    # cast() only satisfies the type checker; the plain dicts are passed as-is.
	    conversation = [
	        Message(
	            role="user",
	            content=cast(List[MessageContentItem], content_parts),
	        )
	    ]
	    available_tools = [{"function": {"name": "image_tool"}}]

	    exec_patch = patch(
	        "api_utils.utils_ext.tools_execution.execute_tool_call",
	        new_callable=AsyncMock,
	    )
	    register_patch = patch("api_utils.utils_ext.tools_execution.register_runtime_tools")

	    with exec_patch as exec_mock, register_patch:
	        exec_mock.return_value = "processed"
	        await maybe_execute_tools(conversation, available_tools, "image_tool")

	    # Per the suite's notes, the text parts are joined
	    # ("Before image\n{\"action\": \"process_image\"}") and the JSON object
	    # is then pulled out of that combined text.
	    exec_mock.assert_called_once_with("image_tool", '{"action": "process_image"}')