| from huggingface_hub import InferenceClient |
| from src.config import BASE_MODEL, MY_MODEL, HF_TOKEN |
| import os |
| from src.utils.profile import load_schema, create_empty_profile, extract_profile_updates, merge_profile, profile_to_summary |
| from src.utils.resources import load_resources, filter_resources, score_resources, format_resources_for_context |
|
|
# Phrases that signal the user is explicitly asking to see facility options.
# Matched as lowercase substrings against the whole message.
RECOMMENDATION_KEYWORDS = [
    "show me", "show options", "show recommendations", "give me options",
    "what options", "what facilities", "find me", "recommend", "recommendations",
    "options near", "what's available", "what is available", "what are my options",
    "just show", "see options", "see recommendations", "list options",
    "i want to see", "can you show", "what do you have",
]


# (category, field) pairs that must be filled before recommendations are
# offered. Location is handled separately: either zipcode OR region suffices.
REQUIRED_PROFILE_FIELDS = [
    ("clinical", "primary_focus"),
    ("preferences", "setting"),
    ("logistics", "insurance"),
]


def _has_enough_for_recommendation(profile: dict) -> bool:
    """Return True once the three required profile fields plus a location
    (zipcode or region) have been collected."""
    fields_ok = all(
        profile.get(category, {}).get(field)
        for category, field in REQUIRED_PROFILE_FIELDS
    )
    if not fields_ok:
        return False

    # Location may arrive as either a zip code or a region/city name.
    logistics = profile.get("logistics", {})
    return bool(logistics.get("zipcode") or logistics.get("region"))


def _user_wants_recommendations(user_input: str) -> bool:
    """Return True if the user is explicitly asking for recommendations."""
    text = user_input.lower()
    for keyword in RECOMMENDATION_KEYWORDS:
        if keyword in text:
            return True
    return False
|
|
|
|
# Substrings that flag crisis language; matched case-insensitively against
# the whole message. The stem "suicid" covers suicide/suicidal/suicidality.
CRISIS_KEYWORDS = [
    "suicid", "kill myself", "want to die", "end my life", "take my life",
    "don't want to live", "dont want to live", "no reason to live",
    "better off dead", "self-harm", "self harm", "hurt myself", "cutting myself",
    "overdose", "overdosing",
]


# Fixed safety response returned verbatim whenever crisis language is
# detected; the message never reaches the language model in that case.
CRISIS_RESPONSE = (
    "I'm really sorry you're going through something this difficult. "
    "You don't have to handle it alone.\n\n"
    "Please reach out for immediate support:\n\n"
    "**Behavioral Health Help Line (BHHL)**\n"
    "📞 Call or text: **833-773-2445**\n"
    "Available 24 hours a day, 7 days a week, 365 days a year.\n"
    "Anyone may contact the Help Line if they or a family member are experiencing "
    "a mental health or substance use disorder crisis.\n\n"
    "If you or someone near you may be in immediate danger, please call **911** right now."
)


def _is_crisis(text: str) -> bool:
    """Return True when any crisis keyword appears in the message."""
    haystack = text.lower()
    for phrase in CRISIS_KEYWORDS:
        if phrase in haystack:
            return True
    return False
|
|
|
|
class Chatbot:
    """Harbor treatment-navigation chatbot.

    Wraps a Hugging Face ``InferenceClient`` and keeps a running user
    profile that is updated from every message. Once the profile holds
    enough information (or the user explicitly asks), matching treatment
    resources are injected into the system prompt for the model to present.
    Crisis language short-circuits everything and returns a fixed hotline
    response.
    """

    def __init__(self):
        """
        Initialize the chatbot with a HF model ID.

        Also loads the user-profile schema and the resource CSV files,
        resolving all paths relative to this source file so the bot works
        from any working directory.
        """
        # Prefer the fine-tuned model when one is configured, else the base model.
        model_id = MY_MODEL if MY_MODEL else BASE_MODEL
        self.client = InferenceClient(model=model_id, token=HF_TOKEN)

        current_dir = os.path.dirname(os.path.abspath(__file__))
        data_dir = os.path.join(current_dir, '..', 'data')
        # The schema drives keyword-based profile extraction; the profile
        # starts empty and fills up as the conversation progresses.
        self.profile_schema = load_schema(os.path.join(data_dir, 'user_profile_schema.json'))
        self.user_profile = create_empty_profile()

        # NOTE(review): resolves to <project>/references/knowledge — confirm
        # both CSVs exist there; presumably load_resources tolerates a missing
        # file, verify before shipping.
        knowledge_dir = os.path.join(data_dir, '..', 'references', 'knowledge')
        resources_paths = [
            os.path.join(knowledge_dir, 'ma_resources.csv'),
            os.path.join(knowledge_dir, 'resources', 'boston_resources.csv'),
        ]
        self.resources = load_resources(resources_paths)

    def reset(self) -> None:
        """Reset conversation state for a new session without re-initializing the client or resources."""
        self.user_profile = create_empty_profile()

    def update_profile(self, user_input: str) -> None:
        """
        Scan user input for profile-relevant information and merge it
        into the running user profile.

        Args:
            user_input (str): The user's message text.
        """
        updates = extract_profile_updates(self.profile_schema, user_input)
        # merge_profile mutates self.user_profile in place.
        merge_profile(self.user_profile, updates)

    def format_prompt(self, user_input: str, turn_number: int = 0):
        """
        Format the user's input into a list of chat messages with system context.
        Updates the user profile with any new information detected from the message.

        This method:
        1. Loads system prompt from system_prompt.md
        2. Updates user profile from schema-based extraction
        3. Injects profile summary into the system prompt so the model knows what's been gathered
        4. From turn 3 onward, appends a pacing instruction listing any
           still-missing intake fields
        5. Returns a list of message dicts for the chat completion API

        Args:
            user_input (str): The user's question
            turn_number (int): Zero-indexed turn count (0 = first user message)

        Returns:
            list[dict]: A list of message dicts with 'role' and 'content' keys
        """

        current_dir = os.path.dirname(os.path.abspath(__file__))

        # Re-read from disk every turn, so edits to system_prompt.md take
        # effect without restarting the process.
        system_prompt_path = os.path.join(current_dir, '../data/system_prompt.md')
        with open(system_prompt_path, 'r', encoding='utf-8') as f:
            system_prompt = f.read().strip()

        # Side effect: mutates self.user_profile with anything extracted
        # from this message.
        self.update_profile(user_input)

        profile_summary = profile_to_summary(self.user_profile)

        # Append the collected-so-far summary so the model doesn't re-ask
        # for information it already has.
        system_content = system_prompt
        if profile_summary:
            system_content = system_content + "\n\n" + profile_summary

        # After a few exchanges, nudge the model to ask for whichever intake
        # fields are still missing (one question per response).
        if turn_number >= 3:
            missing = []
            clinical = self.user_profile.get("clinical", {})
            preferences = self.user_profile.get("preferences", {})
            logistics = self.user_profile.get("logistics", {})
            if not clinical.get("primary_focus"):
                missing.append("type of help needed (substance use, mental health, or both)")
            if not preferences.get("setting"):
                missing.append("preferred treatment setting")
            if not logistics.get("insurance"):
                missing.append("payment method or insurance")
            # Location is satisfied by either a zipcode or a region.
            if not logistics.get("zipcode") and not logistics.get("region"):
                missing.append("location (zip code or city)")

            if missing:
                nudge = (
                    "\n\n[PACING INSTRUCTION — DO NOT REPEAT TO USER] "
                    "You have now had several exchanges. You MUST include a question relevant to "
                    "treatment matching in this response. Ask about one of the following missing fields: "
                    + "; ".join(missing)
                    + ". Ask it warmly and conversationally — one question only."
                )
                system_content = system_content + nudge

        # Only the system message is returned; get_response appends the
        # conversation history and the current user message itself.
        messages = [{"role": "system", "content": system_content}]

        return messages

    def get_response(self, user_input: str, history=None) -> str:
        """
        Generate a response to the user's question, with resource recommendations
        appended when the user profile contains enough information to match.

        Args:
            user_input (str): The user's question
            history (list, optional): Prior turns, either as chat dicts with
                'role'/'content' keys or as (user, assistant) tuples
                (Gradio-style). Defaults to None (first turn).

        Returns:
            str: The chatbot's response, optionally followed by top 3 resources
        """
        # Safety gate: crisis language always returns the fixed hotline text
        # and never reaches the language model.
        if _is_crisis(user_input):
            print("[Harbor] Crisis keywords detected — returning crisis response.")
            return CRISIS_RESPONSE

        # NOTE(review): with tuple-style history len() counts completed
        # exchanges; with dict-style it counts individual messages, so the
        # turn number doubles — confirm which format callers pass.
        turn_number = len(history) if history else 0
        messages = self.format_prompt(user_input, turn_number=turn_number)

        # Second user message always gets a fixed intake prompt. The profile
        # was still updated above via format_prompt, so nothing is lost.
        if history and len(history) == 1:
            return (
                "Thank you for sharing that. Before I give you any recommendations, "
                "can you tell me a little bit about you or the loved one you are concerned about?"
            )

        # Inject matched facilities once the profile is complete enough, or
        # as soon as the user explicitly asks to see options.
        if _has_enough_for_recommendation(self.user_profile) or _user_wants_recommendations(user_input):
            filtered = filter_resources(self.resources, self.user_profile)
            top = score_resources(filtered, self.user_profile)
            if top:
                facility_context = format_resources_for_context(top)
                messages[0]["content"] = messages[0]["content"] + "\n\n" + facility_context
            elif _has_enough_for_recommendation(self.user_profile):
                # Complete profile but zero matches: tell the model to say so
                # rather than let it invent facilities.
                messages[0]["content"] = messages[0]["content"] + (
                    "\n\n[NOTE — No verified facilities matched the user's profile. "
                    "Let the user know you couldn't find a direct match and ask if "
                    "they'd be open to broader options.]"
                )

        # Normalize history: accept both chat-dict entries and
        # (user, assistant) tuples, then append the current message last.
        for item in (history or []):
            if isinstance(item, dict):
                messages.append({"role": item["role"], "content": item["content"]})
            else:
                human, assistant = item
                messages.append({"role": "user", "content": human})
                if assistant is not None:
                    messages.append({"role": "assistant", "content": assistant})
        messages.append({"role": "user", "content": user_input})

        result = self.client.chat_completion(
            messages=messages,
            max_tokens=512,
            temperature=0.7,
        )
        return result.choices[0].message.content.strip()
|
|