Spaces:

yashpinjarkar10
/

WebChat

Runtime error

App Files Files Community

WebChat / app.py

yashpinjarkar10

Upload 9 files

7cf3b7f verified about 1 year ago

raw

history blame contribute delete

4.74 kB

	from fastapi import FastAPI, HTTPException
	from pydantic import BaseModel
	from typing import List, Union
	import os
	from langchain.chains.combine_documents import create_stuff_documents_chain
	from langchain.chains.history_aware_retriever import create_history_aware_retriever
	from langchain.chains.retrieval import create_retrieval_chain
	from langchain_chroma import Chroma
	from langchain_core.messages import SystemMessage, HumanMessage, AIMessage
	from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder
	from langchain_google_genai import GoogleGenerativeAIEmbeddings, ChatGoogleGenerativeAI
	from dotenv import load_dotenv
	from starlette.middleware.cors import CORSMiddleware

	load_dotenv()
	GOOGLE_API_KEY = os.getenv("GOOGLE_API_KEY")

	# Define the persistent directory
	current_dir = os.path.dirname(os.path.abspath(__file__))
	persistent_directory = os.path.join(current_dir, "db", "chroma_db")

	# Initialize embeddings
	embeddings = GoogleGenerativeAIEmbeddings(model="models/embedding-001", api_key=GOOGLE_API_KEY)

	# Load the existing vector store with the embedding function
	db = Chroma(persist_directory=persistent_directory, embedding_function=embeddings)

	# Create a retriever for querying the vector store
	retriever = db.as_retriever(search_type="similarity", search_kwargs={"k": 5})

	# Initialize the LLM
	llm = ChatGoogleGenerativeAI(model="gemini-1.5-flash", api_key=GOOGLE_API_KEY)

	# Contextualize question prompt
	contextualize_q_system_prompt = (
	"Given a chat history and the latest user question "
	"which might reference context in the chat history, "
	"formulate a standalone question which can be understood "
	"without the chat history. Do NOT answer the question, just "
	"reformulate it if needed and otherwise return it as is."
	)

	contextualize_q_prompt = ChatPromptTemplate.from_messages(
	[
	("system", contextualize_q_system_prompt),
	MessagesPlaceholder("chat_history"),
	("human", "{input}"),
	]
	)

	# Create a history-aware retriever
	history_aware_retriever = create_history_aware_retriever(llm, retriever, contextualize_q_prompt)

	# Answer question prompt
	# Update this prompt to reflect your desired behavior (e.g., act as "you")
	qa_system_prompt = (
	"You are an assistant that acts as me. Use the following pieces of retrieved context "
	"to answer the question. If you don't know the answer, just say that you don't know. "
	"Use three sentences maximum and keep the answer concise. Always respond as if you are me."
	"\n\n"
	"{context}"
	)

	qa_prompt = ChatPromptTemplate.from_messages(
	[
	("system", qa_system_prompt),
	MessagesPlaceholder("chat_history"),
	("human", "{input}"),
	]
	)

	# Create a chain to combine documents for question answering
	question_answer_chain = create_stuff_documents_chain(llm, qa_prompt)

	# Create a retrieval chain that combines the history-aware retriever and the question answering chain
	rag_chain = create_retrieval_chain(history_aware_retriever, question_answer_chain)

	app = FastAPI()

	# Global chat history
	chat_history = []

	class ChatRequest(BaseModel):
	input: str

	class ChatResponse(BaseModel):
	answer: str
	# Enable CORS to allow frontend access
	app.add_middleware(
	CORSMiddleware,
	allow_origins=["*"],
	allow_credentials=True,
	allow_methods=["*"],
	allow_headers=["*"],
	)

	# Home route to check if FastAPI is running
	@app.get("/")
	async def root():
	return {"message": "FastAPI Server is Running!"}
	@app.post("/start")
	async def start_chat():
	global chat_history
	chat_history = [] # Reset chat history
	return {"message": "Chat session started. Chat history has been reset."}

	@app.post("/chat", response_model=ChatResponse)
	async def chat(chat_request: ChatRequest):
	global chat_history

	query = chat_request.input

	if query.lower() == "exit":
	raise HTTPException(status_code=400, detail="Use /start to reset the chat session.")

	# Filter out SystemMessage, keeping only HumanMessage and AIMessage
	filtered_chat_history = [
	msg for msg in chat_history if isinstance(msg, HumanMessage) or isinstance(msg, AIMessage)
	]

	# Invoke the RAG chain
	result = rag_chain.invoke({"input": query, "chat_history": filtered_chat_history})

	# Update the chat history
	chat_history.append(HumanMessage(content=query))
	chat_history.append(AIMessage(content=result['answer']))

	return ChatResponse(answer=result['answer'])

	# Run the FastAPI app
	if __name__ == "__main__":
	import uvicorn
	uvicorn.run(app, host="0.0.0.0", port=8080)