# Gemma_Chatbot / app.py — Hugging Face Space entry point
# Author: AvocadoMuffin — commit f239ec4 (verified), "Update app.py"
import gradio as gr
#from gradio.components import Box
import torch
import os
import faiss
import pickle
from transformers import AutoModelForCausalLM, AutoTokenizer
from sentence_transformers import SentenceTransformer, util
from huggingface_hub import hf_hub_download
import pandas as pd
from datasets import Dataset
from huggingface_hub import create_repo
os.environ["HF_HUB_ENABLE_HF_TRANSFER"] = "0"
# Best-effort bitsandbytes import for efficient model loading: prefer the
# GPU build when CUDA is present. The app still runs without the package,
# so an ImportError is only reported, never raised.
try:
    _has_cuda = torch.cuda.is_available()
    if _has_cuda:
        import bitsandbytes as bnb
    else:
        import bitsandbytes  # the same package serves as the CPU fallback
    print("Using bitsandbytes with GPU support." if _has_cuda else "Using bitsandbytes with CPU support.")
except ImportError:
    print("bitsandbytes not found, falling back to CPU.")
# Fine-tuned Gemma checkpoint hosted on the Hugging Face Hub; the same repo
# also carries the FAISS index files downloaded below.
MODEL_NAME = "AvocadoMuffin/Gemma_Fine_Tuned_Model"
HF_TOKEN = os.getenv("HF_TOKEN")  # must be set in the environment for private-repo access
# Pick device/dtype from hardware: fp16 on GPU, fp32 on CPU (fp16 is slow/unsupported on CPU).
device = "cuda" if torch.cuda.is_available() else "cpu"
dtype = torch.float16 if torch.cuda.is_available() else torch.float32
tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME, token=HF_TOKEN)
model = AutoModelForCausalLM.from_pretrained(MODEL_NAME, torch_dtype=dtype, token=HF_TOKEN).to(device)
# Gemma's tokenizer ships without a pad token; reuse EOS so padding works.
tokenizer.pad_token = tokenizer.eos_token
# Download the FAISS index and the pickled knowledge base from the model repo.
faiss_index_path = hf_hub_download(repo_id=MODEL_NAME, filename="faiss_index/index.faiss", token=HF_TOKEN)
knowledge_path = hf_hub_download(repo_id=MODEL_NAME, filename="faiss_index/knowledge.pkl", token=HF_TOKEN)
# Load FAISS index (vector side of the knowledge base).
index = faiss.read_index(faiss_index_path)
# Load knowledge.pkl (text side: questions + answers).
# NOTE(review): pickle.load executes arbitrary code from the downloaded file —
# acceptable only because the repo is project-owned; do not point this at
# third-party repos.
with open(knowledge_path, "rb") as f:
    knowledge_data = pickle.load(f)
# Fail fast if the pickle does not have the expected schema.
if isinstance(knowledge_data, dict) and "questions" in knowledge_data and "answers" in knowledge_data:
    questions = knowledge_data["questions"]
    answers = knowledge_data["answers"]
else:
    raise ValueError("โŒ knowledge.pkl does not contain expected questions and answers keys!")
# Sentence-transformer used both for query embedding and for near-duplicate
# filtering of retrieved answers. Must match the model the index was built with.
embedding_model = SentenceTransformer("multi-qa-mpnet-base-dot-v1")
print("โœ… FAISS Index, Knowledge Data, and Embedding Model Loaded Successfully!")
# ๐Ÿ”น Function: Retrieve Relevant Context from FAISS
def retrieve_relevant_context(query, index, answers, embedding_model, top_k=3, similarity_threshold=0.8):
    """Fetch up to `top_k` knowledge snippets for `query`, dropping near-duplicates.

    The query is embedded and searched against the FAISS index; each candidate
    answer is kept only if its cosine similarity to every already-kept answer
    stays below `similarity_threshold`. Returns the kept snippets joined by
    newlines (empty string when nothing qualifies).
    """
    q_vec = embedding_model.encode([query], convert_to_numpy=True)
    _, hit_ids = index.search(q_vec, top_k)

    snippets = []
    kept_vecs = []
    for hit in hit_ids[0]:
        # FAISS pads missing results with -1; also guard against stale ids.
        if not (0 <= hit < len(answers)):
            continue
        candidate = answers[hit]
        cand_vec = embedding_model.encode([candidate], convert_to_numpy=True)
        # Keep only if sufficiently dissimilar from every snippet already kept
        # (vacuously true for the first candidate).
        is_novel = all(util.cos_sim(cand_vec, prev) < similarity_threshold for prev in kept_vecs)
        if is_novel:
            snippets.append(candidate)
            kept_vecs.append(cand_vec)
    return "\n".join(snippets[:top_k])
# Persona instructions for the two supported assistant modes; the selected
# value is injected verbatim into the generation prompt as SYSTEM MESSAGE
# and also used as a sentinel to pick the prompt template.
SYSTEM_MESSAGES = {
    "general": "You are a helpful AI assistant for everyday tasks.",
    "mental_health": "You are a helpful AI assistant for mental health."
}
# Keywords used to decide whether a query belongs to mental-health mode.
# Matching is a case-insensitive *substring* test, so short entries such as
# "sad" can fire inside unrelated words (e.g. "saddle") — keep entries as
# specific as practical. (Fixed: "trauma" was listed twice.)
MENTAL_HEALTH_KEYWORDS = [
    "anxiety", "depression", "stress", "therapy", "counseling", "mental health", "panic", "trauma",
    "mindfulness", "meditation", "psychological", "self-care", "emotion", "feeling", "mood",
    "psychiatry", "therapist", "psychologist", "burnout", "coping", "ptsd", "ocd", "adhd", "bipolar",
    "schizophrenia", "grief", "insomnia", "wellbeing", "mental wellbeing", "mental wellness",
    "emotional wellbeing", "emotional wellness", "self-help", "relaxation", "breathing exercise",
    "cognitive behavioral", "cbt", "sad", "angry", "worried", "anxious", "depressed", "overwhelmed",
    "psychology", "mental disorder", "suicide", "suicidal", "crisis", "loneliness", "lonely", "isolated",
    "phobia", "addiction", "substance abuse", "eating disorder", "self-esteem", "confidence"
]


def is_mental_health_query(query):
    """Return True when `query` contains any mental-health keyword (case-insensitive)."""
    query_lower = query.lower()
    return any(keyword in query_lower for keyword in MENTAL_HEALTH_KEYWORDS)
# ๐Ÿ”น Function: Generate Response Using RAG
def generate_rag_response(query, model, tokenizer, index, answers, embedding_model, chat_history, system_message, max_new_tokens=200):
    """Generate a reply for `query` using RAG: FAISS-retrieved context + recent chat history.

    Args:
        query: Current user message.
        model / tokenizer: Causal LM and its tokenizer used for generation.
        index / answers / embedding_model: Passed through to retrieve_relevant_context().
        chat_history: List of {"role", "content"} dicts; the last 5 entries feed the prompt.
        system_message: One of the SYSTEM_MESSAGES values; selects the prompt template.
        max_new_tokens: Generation budget for model.generate().

    Returns:
        The decoded model continuation (prompt prefix stripped), or a canned
        refusal when an off-topic query arrives in mental-health mode.
    """
    # Mental-health mode refuses queries the keyword check deems off-topic.
    if system_message == SYSTEM_MESSAGES["mental_health"] and not is_mental_health_query(query):
        return "I'm currently in mental health assistant mode and can only answer questions related to mental health, psychology, emotions, and wellbeing. If you'd like to discuss other topics, please change the system message to general assistant mode."
    query_lower = query.strip().lower()
    # Phrases that signal the user wants the previous answer continued.
    follow_up_triggers = ["continue", "go on", "tell me more", "what else?", "elaborate", "explain more"]
    is_follow_up = any(trigger in query_lower for trigger in follow_up_triggers)
    # Retrieve relevant knowledge snippets from the FAISS index.
    retrieved_context = retrieve_relevant_context(query, index, answers, embedding_model).strip()
    # Flatten the last 5 chat entries into plain text for the prompt.
    chat_context = "\n".join([msg["content"] for msg in chat_history[-5:]])
    # For follow-ups, prepend the previous message so the model continues smoothly.
    # NOTE(review): with the current caller (chatbot() appends the user turn
    # before calling this), chat_history[-1] is the just-appended *user*
    # message, not the last AI reply — confirm whether [-2] was intended.
    if is_follow_up and chat_history:
        last_ai_response = chat_history[-1]  # Get last AI message
        query = f"{last_ai_response['content']} {query}"  # Append the follow-up to continue smoothly
    # Few-shot examples used in mental-health mode only (and only once a
    # conversation exists — see the prompt construction below).
    few_shot_examples = """
User: What are some effective meditation techniques for beginners?
AI: Based on established research, here are some effective meditation techniques for beginners:
1. Mindful Breathing - Focus on your breath, noticing the sensation of air moving in and out of your body.
2. Body Scan Meditation - Progressively relax different parts of your body from head to toe.
3. Loving-Kindness Meditation - Direct positive wishes toward yourself and others.
4. Guided Meditation - Follow along with recorded instructions to help maintain focus.
5. Walking Meditation - Practice mindfulness while walking slowly and deliberately.
I recommend starting with just 5 minutes daily and gradually increasing duration. Would you like more details about any specific technique, or would you prefer suggestions for apps that could help you get started?
User: Tell me more about body scan meditation.
AI: Body scan meditation is a mindfulness practice where you systematically focus your attention on different parts of your body, from your toes to the top of your head.
Here's how to practice it:
1. Lie down in a comfortable position or sit in a chair with your feet on the ground
2. Close your eyes and take several deep breaths
3. Begin by bringing awareness to your toes, noticing any sensations (tingling, temperature, tension)
4. Gradually move your attention upward (feet, ankles, calves, etc.)
5. For each body part, notice sensations without judgment, then consciously relax that area
6. If you notice pain or discomfort, acknowledge it with compassion before moving on
7. Continue until you've scanned your entire body
Regular practice can help reduce stress, improve body awareness, and release physical tension. Many find it helpful for sleep issues as well.
Would you like guidance on how long to practice or how to handle common challenges like mind-wandering during body scans?
"""
    # Pick the prompt template for the active mode.
    if system_message == SYSTEM_MESSAGES["mental_health"]:
        prompt = f"""You are a compassionate mental wellness assistant powered by a retrieval-augmented generation (RAG) system.
Maintain a warm, supportive conversation while providing evidence-based mental health information.
SYSTEM MESSAGE: {system_message}
When responding to mental health queries:
- Provide evidence-based information from reputable sources
- Keep the tone supportive, non-judgmental, and empathetic
- If uncertain about mental health information, acknowledge limitations and avoid potentially harmful advice
- For crisis situations, recommend professional help rather than providing advice
- Frame mental wellness information in a way that emphasizes self-compassion and gradual progress
If the user expresses overwhelm, anxiety, or difficulty with their mental health, offer evidence-based coping strategies and gentle support.
{few_shot_examples if len(chat_history) > 0 else ""}
"""
    else:
        prompt = f"""You are a helpful AI assistant designed to answer questions on a wide range of topics.
Provide accurate, concise information while maintaining a conversational tone.
SYSTEM MESSAGE: {system_message}
When responding to queries:
- Provide accurate information on the requested topic
- Keep explanations clear and easy to understand
- Be conversational and friendly
- If you don't know something, acknowledge limitations rather than making up information
"""
    # Only append the retrieved context section when retrieval found something.
    if retrieved_context:
        prompt += f"\n๐Ÿ“Œ Relevant Information Retrieved:\n{retrieved_context}\n\n"
    prompt += f"๐Ÿ’ฌ Chat History:\n{chat_context}\n๐Ÿ‘ค User: {query}\n๐Ÿค– AI:"
    # Tokenize the assembled prompt (module-level `device` chosen at startup).
    input_ids = tokenizer(prompt, return_tensors="pt").input_ids.to(device)
    # Generate without gradient tracking (inference only).
    with torch.no_grad():
        output_ids = model.generate(
            input_ids,
            max_new_tokens=max_new_tokens,
            eos_token_id=tokenizer.eos_token_id,
        )
    response = tokenizer.decode(output_ids[0], skip_special_tokens=True).strip()
    # Causal LMs echo the prompt; strip it so only the continuation is returned.
    if response.startswith(prompt):
        response = response[len(prompt):].strip()
    return response
# ๐Ÿ”น Function to save feedback for RLHF
from huggingface_hub import create_repo, HfApi
from datasets import Dataset, load_dataset
import pandas as pd
import os
import json
def save_feedback(query, response, feedback, comment=""):
    """Persist one feedback record locally and (best-effort) to the HF Hub dataset.

    Merges the new record with any existing data (local CSV first, Hub copy as
    fallback), writes the combined CSV locally, then pushes it to the Hub.

    Args:
        query: The user query that produced the response.
        response: The assistant response being rated.
        feedback: 1 (like), 0 (dislike), or None when no rating was given.
        comment: Optional free-text comment.

    Returns:
        A fixed status string; errors are printed, never raised.
    """
    feedback_file = "chat_feedback.csv"
    repo_name = "AvocadoMuffin/Chat_Feedback_Data"
    # One-row frame for the current feedback record.
    new_data = pd.DataFrame([[query, response, feedback, comment]],
                            columns=["Query", "Response_Generated", "Feedback", "Comment"])
    # Tracks whether the combined data already reached the local CSV, so the
    # error path below does not append the same record a second time.
    saved_locally = False
    try:
        # Prefer the local copy when we have one.
        if os.path.exists(feedback_file):
            existing_data = pd.read_csv(feedback_file)
            print(f"Loaded existing data from local file with {len(existing_data)} records")
        else:
            # Otherwise try to pull the dataset from the HF Hub.
            api = HfApi()
            try:
                # List repo files to locate the data file.
                files = api.list_repo_files(repo_id=repo_name, repo_type="dataset")
                data_files = [f for f in files if f.endswith('.parquet') or f.endswith('.csv')]
                if data_files:
                    # Download the first data file we find.
                    file_path = api.hf_hub_download(
                        repo_id=repo_name,
                        filename=data_files[0],
                        repo_type="dataset"
                    )
                    # Load according to file extension.
                    if file_path.endswith('.parquet'):
                        existing_data = pd.read_parquet(file_path)
                    else:
                        existing_data = pd.read_csv(file_path)
                    print(f"Successfully loaded data from Hub with {len(existing_data)} records")
                else:
                    print("No data files found in repository")
                    existing_data = pd.DataFrame(columns=["Query", "Response_Generated", "Feedback", "Comment"])
            except Exception as e:
                # Hub unavailable or repo empty: start a fresh frame.
                print(f"Error accessing repository: {e}")
                existing_data = pd.DataFrame(columns=["Query", "Response_Generated", "Feedback", "Comment"])
        # Append new feedback to the existing data.
        updated_data = pd.concat([existing_data, new_data], ignore_index=True)
        print(f"Updated dataset now has {len(updated_data)} records")
        # Always save locally for backup and future reference.
        updated_data.to_csv(feedback_file, index=False)
        saved_locally = True
        print(f"Saved updated data to local file with {len(updated_data)} records")
        # Push the combined data to the Hub (creating the repo if needed).
        dataset = Dataset.from_pandas(updated_data)
        create_repo(repo_id=repo_name, repo_type="dataset", exist_ok=True)
        dataset.push_to_hub(repo_name)
        print("Feedback saved and dataset updated on Hugging Face!")
    except Exception as e:
        print(f"Error updating dataset: {e}")
        # BUGFIX: only write the backup when the record never reached the local
        # CSV. Previously a failed Hub push *after* a successful local save
        # appended the same record a second time, duplicating it.
        if not saved_locally:
            if os.path.exists(feedback_file):
                local_data = pd.read_csv(feedback_file)
                pd.concat([local_data, new_data], ignore_index=True).to_csv(feedback_file, index=False)
            else:
                new_data.to_csv(feedback_file, index=False)
            print("Saved locally only due to error")
    return "Feedback saved and dataset updated!"
# ๐Ÿ”น The chatbot function (with RAG and conversation history tracking)
def chatbot(query, chat_history=None, system_message=SYSTEM_MESSAGES["general"]):
    """Handle one chat turn for the Gradio UI.

    Appends the user message and the generated reply to `chat_history`,
    renders the whole conversation as styled HTML, and returns the component
    updates expected by the submit handlers in create_gradio_interface().
    """
    if chat_history is None:
        chat_history = []  # Fresh conversation
    # Record the user turn before generating (generate_rag_response reads history).
    chat_history.append({"role": "user", "content": query})
    # Generate the reply with the module-level model/index and the active mode.
    response = generate_rag_response(query, model, tokenizer, index, answers, embedding_model, chat_history, system_message)
    # Record the assistant turn so future calls see full context.
    chat_history.append({"role": "assistant", "content": response})
    # Render the conversation as inline-styled HTML bubbles (blue = user, green = AI).
    formatted_chat_history = ""
    for msg in chat_history:
        if msg["role"] == "user":
            formatted_chat_history += f'<p style="color: #4A90E2; font-weight: bold;">User:</p><p style="background-color: #E7F1F8; padding: 10px; border-radius: 5px; font-family: Arial, sans-serif; font-size: 14px;">{msg["content"]}</p>'
        else:
            formatted_chat_history += f'<p style="color: #1D4ED8; font-weight: bold;">AI:</p><p style="background-color: #D1F4D9; padding: 10px; border-radius: 5px; font-family: Arial, sans-serif; font-size: 14px;">{msg["content"]}</p>'
    # Return order must match the `outputs=` list in the event wiring:
    # chat HTML, history state, feedback radio (shown + cleared), feedback
    # button (shown), comment box (shown + cleared), latest response, cleared
    # input textbox, latest query.
    return gr.HTML(formatted_chat_history), chat_history, gr.update(visible=True, value=None), gr.update(visible=True), gr.update(visible=True, value=""), response, gr.update(value=""), query
# Function to handle feedback submission
def handle_feedback(query, latest_response, feedback, comment):
    """Persist the user's optional rating for the last exchange, then hide the feedback widgets."""
    # Map the radio selection to a numeric label; no selection is stored as None.
    rating = None
    if feedback:
        rating = 1 if feedback == "๐Ÿ‘ Like" else 0
    save_feedback(query, latest_response, rating, comment)
    # Collapse the feedback controls and clear their values for the next turn.
    return gr.update(visible=False, value=None), gr.update(visible=False), gr.update(visible=False, value="")
# Function to handle system message change and reset chat
def change_system_message(message_key, chat_history_state):
    """Switch assistant mode: discard the conversation and greet in the new mode.

    Returns the rendered greeting HTML, the fresh history list, and the
    system-message string for the selected mode.
    """
    selected_message = SYSTEM_MESSAGES[message_key]
    # Mode-specific greeting for the freshly reset conversation.
    if message_key == "mental_health":
        welcome_message = "I'm now in mental health assistant mode. I can help with questions about mental health, wellness, emotions, and psychological well-being. How can I support you today?"
    else:
        welcome_message = "I'm here to help with a wide range of questions and tasks. What would you like assistance with today?"
    new_chat_history = [{"role": "assistant", "content": welcome_message}]
    # Render with the same bubble styling the chat view uses for AI messages.
    formatted_chat_history = f'<p style="color: #1D4ED8; font-weight: bold;">AI:</p><p style="background-color: #D1F4D9; padding: 10px; border-radius: 5px; font-family: Arial, sans-serif; font-size: 14px;">{welcome_message}</p>'
    return gr.HTML(formatted_chat_history), new_chat_history, selected_message
def create_gradio_interface():
    """Build and return the Gradio Blocks UI for the chatbot.

    Layout: a chat column (history, input, optional feedback widgets) beside a
    system-message column (example table, mode selector, current-instruction
    display, reset button). All event wiring (submit/click/change/load) is
    done at the end of this function.
    """
    with gr.Blocks() as demo:
        gr.Markdown("## **๐Ÿง  Mindful Bot: AI for Everything**")
        gr.Markdown("An AI chatbot designed to offer empathetic support for mental wellness using RAG-based techniques, capable of handling adversarial queries with care. It also provides insightful responses to general queries, separating wellness-related conversations for more focused, compassionate assistance.")
        # Hidden per-session state carried between event handlers.
        latest_query = gr.State("")
        latest_response = gr.State("")
        chat_history_state = gr.State([])
        current_system_message = gr.State(SYSTEM_MESSAGES["general"])
        with gr.Row():
            with gr.Column(scale=7):  # Chat area
                # Rendered conversation (HTML bubbles produced by chatbot()).
                chat_history_box = gr.HTML(label="Chat History", elem_id="chat-history")
                with gr.Row():
                    with gr.Column(scale=8):
                        query = gr.Textbox(label="Enter your query", elem_id="user-input", lines=3)
                    with gr.Column(scale=2):
                        submit_button = gr.Button("Submit", elem_id="submit-button", variant="primary")
                # Feedback UI — hidden until a response exists; no default selection.
                feedback = gr.Radio(choices=["๐Ÿ‘ Like", "๐Ÿ‘Ž Dislike"], label="Feedback (Optional)", type="value", visible=False)
                submit_feedback_button = gr.Button("Submit Feedback", visible=False)
                feedback_comments = gr.Textbox(label="Additional Comments (optional)", lines=2, visible=False)
            with gr.Column(scale=3):  # System message area
                with gr.Group():
                    gr.HTML("<h2 style='text-align: center; color: white; background-color: orange; padding: 10px;'>System message</h2>")
                    # Example table illustrating which mode fits which message.
                    example_table = gr.Dataframe(
                        headers=["Message", "System message"],
                        datatype=["str", "str"],
                        value=[
                            ["Hello! How are you?", SYSTEM_MESSAGES["mental_health"]],
                            ["Can you help with a recipe for baking a cake?", SYSTEM_MESSAGES["general"]],
                        ],
                        row_count=2,
                        col_count=2,
                        interactive=True,
                        #height=150
                    )
                    # Mode selector: keys into SYSTEM_MESSAGES.
                    system_selector = gr.Radio(
                        choices=["general", "mental_health"],
                        value="general",
                        label="Select system message type",
                        elem_id="system-selector",
                        info="Choose the type of assistant"
                    )
                    # Read-only display of the active system instruction.
                    system_message_display = gr.Textbox(
                        value=SYSTEM_MESSAGES["general"],
                        label="Current system instruction:",
                        interactive=False
                    )
                    # Reset button (re-runs the mode-change handler).
                    reset_button = gr.Button("Reset Chat", elem_id="reset-button")
        # Custom CSS injected via an HTML component.
        gr.HTML("""<style>
#chat-history { background-color: #f5f5f5; border-radius: 10px; padding: 10px; max-height: 400px; overflow-y: scroll; font-family: 'Arial', sans-serif; }
#user-input { margin-top: 10px; border-radius: 10px; }
#submit-button { margin-top: 10px; }
#system-selector { margin-top: 10px; }
</style>""")
        # Event wiring. Enter in the textbox and the Submit button run the same
        # handler; the outputs list must match chatbot()'s 8-tuple return order.
        query.submit(chatbot,
                     inputs=[query, chat_history_state, current_system_message],
                     outputs=[chat_history_box, chat_history_state, feedback, submit_feedback_button, feedback_comments, latest_response, query, latest_query])
        submit_button.click(chatbot,
                            inputs=[query, chat_history_state, current_system_message],
                            outputs=[chat_history_box, chat_history_state, feedback, submit_feedback_button, feedback_comments, latest_response, query, latest_query])
        # Feedback submission: persists the rating, then hides the widgets.
        submit_feedback_button.click(handle_feedback,
                                     inputs=[latest_query, latest_response, feedback, feedback_comments],
                                     outputs=[feedback, submit_feedback_button, feedback_comments])
        # Mode change resets the chat and swaps the system message...
        system_selector.change(change_system_message,
                               inputs=[system_selector, chat_history_state],
                               outputs=[chat_history_box, chat_history_state, current_system_message])
        # ...and mirrors the new instruction into the read-only display.
        system_selector.change(lambda x: SYSTEM_MESSAGES[x],
                               inputs=[system_selector],
                               outputs=[system_message_display])
        # Reset button reuses the same two handlers as a mode change.
        reset_button.click(change_system_message,
                           inputs=[system_selector, chat_history_state],
                           outputs=[chat_history_box, chat_history_state, current_system_message])
        reset_button.click(lambda x: SYSTEM_MESSAGES[x],
                           inputs=[system_selector],
                           outputs=[system_message_display])
        # On page load: show the welcome message for the default mode...
        demo.load(change_system_message,
                  inputs=[system_selector, chat_history_state],
                  outputs=[chat_history_box, chat_history_state, current_system_message])
        # ...and initialize the system-message display.
        demo.load(lambda x: SYSTEM_MESSAGES[x],
                  inputs=[system_selector],
                  outputs=[system_message_display])
    return demo
# Build and launch the UI at import time — this file is meant to be executed
# directly as the Space's entry point (no __main__ guard by design).
demo = create_gradio_interface()
demo.launch(share=False, debug=True)