Test_TutorAI_We / app.py
Lesterchia1's picture
Update app.py
40fa7be verified
raw
history blame
7.87 kB
import os
import re
import uuid
import tempfile
import numpy as np
import gradio as gr
import chardet
import fitz # PyMuPDF
import docx
import gtts
from pptx import Presentation
from typing import TypedDict, List
from langchain_community.tools import DuckDuckGoSearchRun
from langchain_core.messages import BaseMessage, HumanMessage, AIMessage, SystemMessage
from langgraph.graph import StateGraph, END
from langchain_groq import ChatGroq
#from langchain_huggingface.embeddings import HuggingFaceEmbeddings
from langchain_community.embeddings import HuggingFaceEmbeddings
from langchain_community.vectorstores import Chroma
from langchain_text_splitters import RecursiveCharacterTextSplitter
from langchain_core.documents import Document
# --- 1. INITIALIZATION & CORE TOOLS ---
# NOTE(review): GROQ_API_KEY must be present in the environment (e.g. Space
# secrets); ChatGroq is constructed at import time, so a missing key surfaces
# on the first model call rather than here.
groq_api_key = os.getenv("GROQ_API_KEY")
chat_model = ChatGroq(model_name="llama-3.3-70b-versatile", api_key=groq_api_key)
web_search_tool = DuckDuckGoSearchRun()
embedding_model = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
# Persistent local vector store backing the RAG lookups; reuses chroma_db/ on disk.
vectorstore = Chroma(embedding_function=embedding_model, persist_directory="chroma_db")
# --- 2. HELPER FUNCTIONS ---
def clean_response(response):
    """Strip model reasoning and markdown noise from an LLM reply.

    Removes <think>...</think> blocks (including an unterminated trailing
    one), any stray think tags, and the markdown characters ** * [ ] #,
    then trims surrounding whitespace.

    Args:
        response: Raw text returned by the chat model.

    Returns:
        The cleaned plain-text reply.
    """
    # Remove think blocks lazily, up to the closing tag or end of string
    # (case-insensitive; DOTALL so blocks may span newlines).
    cleaned = re.sub(r"<think>.*?(?:</think>|$)", "", response, flags=re.DOTALL | re.IGNORECASE)
    # Remove orphaned think tags and common markdown symbols.
    cleaned = re.sub(r"</?think>|\*\*|\*|\[|\]|#", "", cleaned)
    return cleaned.strip()
def retrieve_documents(query):
    """Return the page contents of the three stored chunks most similar to *query*."""
    hits = vectorstore.similarity_search(query, k=3)
    return [hit.page_content for hit in hits]
def speech_playback(text):
    """Synthesize *text* (truncated to 500 chars) to an MP3 via gTTS.

    Args:
        text: Text to speak; only the first 500 characters are used to keep
            the gTTS request small.

    Returns:
        Path to the generated MP3 file, or None if synthesis failed
        (e.g. no network access to the Google TTS endpoint).
    """
    try:
        unique_id = str(uuid.uuid4())
        # Write into the system temp directory: the previous hard-coded
        # /content/ prefix only exists on Google Colab and fails elsewhere
        # (e.g. Hugging Face Spaces).
        audio_file = os.path.join(tempfile.gettempdir(), f"output_audio_{unique_id}.mp3")
        tts = gtts.gTTS(text[:500], lang='en')
        tts.save(audio_file)
        return audio_file
    except Exception as e:
        # Best-effort: audio is optional, so log and degrade gracefully.
        print(f"TTS error: {e}")
        return None
# --- 3. DOCUMENT INGESTION FUNCTION ---
def extract_and_store_document(file_path: str):
    """Extract text from an uploaded file, chunk it, and index it in Chroma.

    Supports PDF, DOCX and PPTX; anything else is read as plain text with
    best-effort encoding detection.

    Returns:
        True when at least one chunk was stored, False on empty text or error.
    """
    text = ""
    suffix = os.path.splitext(file_path)[1].lower()
    try:
        if suffix == ".pdf":
            pdf = fitz.open(file_path)
            for page in pdf:
                text += page.get_text()
            pdf.close()
        elif suffix == ".docx":
            word_doc = docx.Document(file_path)
            text = "\n".join(para.text for para in word_doc.paragraphs)
        elif suffix == ".pptx":
            deck = Presentation(file_path)
            for slide in deck.slides:
                for shape in slide.shapes:
                    # Not every shape carries text (images, charts, ...).
                    if hasattr(shape, "text"):
                        text += shape.text + "\n"
        else:
            # Fallback: treat as plain text, sniffing the encoding.
            with open(file_path, 'rb') as fh:
                raw = fh.read()
            detected = chardet.detect(raw)['encoding'] or 'utf-8'
            text = raw.decode(detected, errors='ignore')

        if not text.strip():
            return False

        splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
        source_name = os.path.basename(file_path)
        docs = [
            Document(page_content=piece, metadata={"source": source_name})
            for piece in splitter.split_text(text)
        ]
        vectorstore.add_documents(docs)
        vectorstore.persist()
        return True
    except Exception as e:
        # Ingestion is user-triggered; report failure instead of crashing the UI.
        print(f"Error processing {file_path}: {e}")
        return False
# --- 4. REFRAG MULTI-AGENT LOGIC (LangGraph) ---
class AgentState(TypedDict):
    """Shared state threaded through the LangGraph pipeline (sense -> expand -> generate)."""
    messages: List[BaseMessage]  # conversation so far; last entry is the pending user query
    context: str                 # retrieved local chunks, optionally prefixed with web results
    decision: str                # router verdict: "RAG" (docs suffice) or "WEB" (search needed)
    source: str                  # human-readable provenance label appended to the final answer
def sensing_node(state: AgentState):
    """Route the query: 'RAG' when local docs suffice, otherwise 'WEB'."""
    query = state["messages"][-1].content
    docs = retrieve_documents(query)
    context = "\n".join(docs) if docs else ""
    router_prompt = (
        f"Docs: {context}\nQuery: {query}\n"
        "If docs answer this, reply 'RAG'. Else reply 'WEB'."
    )
    verdict = chat_model.invoke([HumanMessage(content=router_prompt)]).content.strip().upper()
    # Tolerate chatty replies: any mention of RAG counts as a RAG vote.
    routed = "RAG" if "RAG" in verdict else "WEB"
    return {"context": context, "decision": routed}
def expansion_node(state: AgentState):
    """Augment the context with a web search when the router chose 'WEB'."""
    if state["decision"] != "WEB":
        return {"source": "Local Documents Only"}
    query = state["messages"][-1].content
    web_data = web_search_tool.run(query)
    merged = f"WEB INFO: {web_data}\nLOCAL: {state['context']}"
    return {"context": merged, "source": "Web + Local Documents"}
def generation_node(state: AgentState):
    """Produce the tutor's answer grounded in the gathered context, with a source tag."""
    system_msg = f"You are a Tutor AI. Use this context: {state['context']}"
    transcript = [SystemMessage(content=system_msg)] + state["messages"]
    raw_reply = chat_model.invoke(transcript)
    body = clean_response(raw_reply.content)
    tagged = f"{body}\n\n*(Verified via: {state['source']})*"
    return {"messages": [AIMessage(content=tagged)]}
# Linear pipeline: sense (route) -> expand (optional web search) -> generate (answer).
workflow = StateGraph(AgentState)
workflow.add_node("sense", sensing_node)
workflow.add_node("expand", expansion_node)
workflow.add_node("generate", generation_node)
workflow.set_entry_point("sense")
workflow.add_edge("sense", "expand")
workflow.add_edge("expand", "generate")
workflow.add_edge("generate", END)
# Compiled runnable used by the Gradio chat handler.
app_agent = workflow.compile()
# --- 5. GRADIO APP WITH MANUAL AUDIO ---
# Store last assistant response globally (simple approach for demo).
# NOTE(review): a single module-level global is shared across all user
# sessions; concurrent users will overwrite each other's pending audio text.
last_assistant_response = ""
def chat_handler(user_input, chat_history):
    """Run one chat turn through the agent graph and update the transcript.

    Returns (updated history, cleared textbox value, cleared audio) so the
    audio player never autoplays on submit.
    """
    global last_assistant_response
    if not user_input:
        return chat_history, "", None

    initial_state = {
        "messages": [HumanMessage(content=user_input)],
        "context": "",
        "decision": "",
        "source": "",
    }
    outcome = app_agent.invoke(initial_state)
    answer = outcome["messages"][-1].content

    chat_history.append({"role": "user", "content": user_input})
    chat_history.append({"role": "assistant", "content": answer})

    # Keep the spoken text free of the trailing "*(Verified via: ...)*" note.
    last_assistant_response = answer.split("*(Verified")[0].strip()
    return chat_history, "", None
def generate_audio():
    """Synthesize speech for the most recent assistant reply, if any."""
    global last_assistant_response
    if last_assistant_response:
        return speech_playback(last_assistant_response)
    return None
def upload_file(file):
    """Ingest an uploaded document into the vector store and report the outcome."""
    if file is None:
        return "โŒ No file uploaded."
    try:
        display_name = os.path.basename(file.name)
        if extract_and_store_document(file.name):
            return f"โœ… **{display_name}** successfully parsed and added to knowledge base!"
        return f"โš ๏ธ Failed to extract text from **{display_name}**."
    except Exception as e:
        return f"โŒ Error: {str(e)}"
with gr.Blocks() as demo:
    gr.Markdown("# ๐ŸŽ“ REFRAG Multi-Agent Tutor")
    with gr.Tab("AI Chatbot"):
        # chat_handler appends openai-style {"role", "content"} dicts, so the
        # Chatbot must use the "messages" format — without type="messages"
        # Gradio expects tuple pairs and rejects dict entries.
        chatbot = gr.Chatbot(type="messages", value=[], height=400)
        with gr.Row():
            msg = gr.Textbox(placeholder="Ask your tutor...", scale=4)
            submit = gr.Button("Send", variant="primary")
        # Manual audio control: audio is only generated on explicit request.
        with gr.Row():
            play_audio_btn = gr.Button("๐Ÿ”Š Play Audio Response", variant="secondary")
            audio_out = gr.Audio(label="Audio Response", autoplay=False)  # autoplay=False
        # Chat submission via button or Enter key; both clear the textbox and audio.
        submit.click(chat_handler, [msg, chatbot], [chatbot, msg, audio_out])
        msg.submit(chat_handler, [msg, chatbot], [chatbot, msg, audio_out])
        # Manual audio generation for the last assistant reply.
        play_audio_btn.click(generate_audio, None, audio_out)
    with gr.Tab("Upload Notes"):
        file_input = gr.File(label="Upload PDF / DOCX / PPTX / TXT", file_types=[".pdf", ".docx", ".pptx", ".txt"])
        upload_status = gr.Markdown()
        file_input.change(upload_file, file_input, upload_status)

demo.launch(share=True, debug=True)