Spaces:

pgits
/

voiceCal-ai-v2

Sleeping

App Files Files Community

voiceCal-ai-v2 / app /core /custom_parser.py

pgits

Implement custom ReActOutputParser to return tool responses verbatim

8dbd2ad 7 months ago

raw

history blame contribute delete

7.59 kB

	"""Custom output parser for ReActAgent that returns tool responses verbatim for booking confirmations."""

	from typing import Dict, Optional
	import re
	import logging

	from llama_index.core.agent.react.output_parser import ReActOutputParser
	from llama_index.core.agent.react.types import BaseReasoningStep, ResponseReasoningStep


	class VerbatimOutputParser(ReActOutputParser):
	"""Custom parser that returns tool responses verbatim for booking confirmations.

	This parser extends the default ReActOutputParser to detect specific tool responses
	(like booking confirmations) and return them directly to the user without the
	ReAct agent's typical summarization behavior.
	"""

	def __init__(self, verbatim_patterns: Optional[Dict[str, str]] = None):
	"""Initialize the verbatim output parser.

	Args:
	verbatim_patterns: Dictionary of pattern names to regex patterns that
	should trigger verbatim response handling.
	"""
	super().__init__()

	# Default patterns for detecting responses that should be returned verbatim
	self.verbatim_patterns = verbatim_patterns or {
	'booking_confirmation': r'Perfect! ✅.Meeting confirmed.📅',
	'meeting_ids': r'Meeting ID:.*Calendar ID:',
	'google_meet': r'🎥 Google Meet',
	'cancellation_success': r'✅.cancelled.successfully',
	'email_notification': r'📧 Email invitations',
	'celebration_marker': r'<div id="booking-success"',
	'authentication_error': r'I need to reconnect to your calendar'
	}

	# Set up logging
	self.logger = logging.getLogger(__name__)

	def should_return_verbatim(self, output: str) -> bool:
	"""Determine if output should be returned without ReAct processing.

	Args:
	output: The raw LLM output string

	Returns:
	True if this output should be returned verbatim, False otherwise
	"""
	# Check for tool response markers that indicate this is a complete tool response
	tool_response_indicators = [
	'Perfect! ✅', # Booking confirmation start
	'✅ Meeting', # Cancellation or meeting updates
	'📅 **', # Date/time formatting
	'Meeting ID:', # Meeting ID display
	'🎥 Google Meet', # Google Meet link
	'📧 Email invitations', # Email status
	'<div id="booking-success"', # Celebration marker
	'I need to reconnect', # Auth error
	'Oops! You already have', # Scheduling conflicts
	"I'm having trouble", # General errors
	'Available times:', # Availability responses
	'Here are your upcoming' # Event listing responses
	]

	# If any indicator is present, check against patterns
	if any(indicator in output for indicator in tool_response_indicators):
	for pattern_name, pattern in self.verbatim_patterns.items():
	if re.search(pattern, output, re.DOTALL \| re.IGNORECASE):
	self.logger.info(f"Verbatim response triggered by pattern: {pattern_name}")
	return True

	return False

	def extract_verbatim_response(self, output: str) -> str:
	"""Extract the clean verbatim response from the output.

	Args:
	output: The raw LLM output

	Returns:
	Cleaned response suitable for direct user display
	"""
	# If this looks like a tool response, try to extract just the tool output part

	# Look for "Observation:" followed by the tool response
	observation_pattern = r'Observation:\s(.?)(?=\n\nThought:\|$)'
	observation_match = re.search(observation_pattern, output, re.DOTALL)

	if observation_match:
	tool_response = observation_match.group(1).strip()
	self.logger.info(f"Extracted tool response from Observation: {tool_response[:100]}...")
	return tool_response

	# Look for responses that start with common tool response patterns
	response_start_patterns = [
	r'(Perfect! ✅.*)',
	r'(✅.Meeting.)',
	r'(I need to reconnect.*)',
	r'(Oops! You already have.*)', # Conflict messages
	r'(I\'m having trouble.*)', # Error messages
	]

	for pattern in response_start_patterns:
	match = re.search(pattern, output, re.DOTALL)
	if match:
	response = match.group(1).strip()
	self.logger.info(f"Extracted response by pattern: {response[:100]}...")
	return response

	# Handle cases where the output is already clean (direct tool response)
	if any(indicator in output for indicator in ['✅', '📅', '🎥', '📧', 'Meeting ID:']):
	self.logger.info("Output appears to be clean tool response already")
	return output.strip()

	# Fallback: return the output as-is if we can't extract cleanly
	self.logger.warning("Could not extract clean tool response, returning full output")
	return output.strip()

	def parse(self, output: str, is_streaming: bool = False) -> BaseReasoningStep:
	"""Parse the LLM output, returning verbatim responses when appropriate.

	Args:
	output: Raw LLM output string
	is_streaming: Whether this is part of a streaming response

	Returns:
	BaseReasoningStep - either verbatim ResponseReasoningStep or normal parsing
	"""
	try:
	# Check if this should be returned verbatim
	if self.should_return_verbatim(output):
	# Extract the clean response
	verbatim_response = self.extract_verbatim_response(output)

	# Return as a ResponseReasoningStep to end the ReAct loop
	return ResponseReasoningStep(
	thought="Tool provided complete response that should be returned verbatim.",
	response=verbatim_response,
	is_streaming=is_streaming
	)

	# Otherwise, use the default ReAct parsing
	return super().parse(output, is_streaming)

	except Exception as e:
	self.logger.error(f"Error in custom parser: {e}, falling back to default parsing")
	# Fallback to default parsing if our custom logic fails
	return super().parse(output, is_streaming)


	# Configuration for the verbatim parser
	VERBATIM_RESPONSE_CONFIG = {
	'enabled': True,
	'tools': ['create_appointment', 'cancel_meeting_by_id', 'cancel_meeting_by_details', 'check_availability', 'list_upcoming_events'],
	'patterns': {
	'booking_confirmation': r'Perfect! ✅.Meeting confirmed.📅',
	'meeting_ids': r'Meeting ID:.*Calendar ID:',
	'google_meet': r'🎥 Google Meet',
	'cancellation_success': r'✅.cancelled.successfully',
	'email_notification': r'📧 Email invitations',
	'celebration_marker': r'<div id="booking-success"',
	'authentication_error': r'I need to reconnect to your calendar',
	'scheduling_conflict': r'Oops! You already have.*scheduled at that time',
	'general_error': r"I'm having trouble.*right now",
	'availability_list': r'Available times:.*AM\|PM',
	'event_listing': r'Here are your upcoming.*meetings'
	},
	'fallback_on_error': True,
	'debug_logging': True
	}