Spaces:

lei0lei
/

chat-pdf

Sleeping

chat-pdf / chain.py

d5f54fe over 2 years ago

4.93 kB

	import os
	from langchain.embeddings.openai import OpenAIEmbeddings
	from langchain.text_splitter import CharacterTextSplitter
	from langchain.vectorstores import Chroma
	from langchain.chains import ConversationalRetrievalChain
	from langchain.chat_models import ChatOpenAI
	from langchain.document_loaders import PyPDFLoader
	import fitz
	from PIL import Image
	import gradio as gr
	import structlog
	from langchain.text_splitter import RecursiveCharacterTextSplitter

	# Module-wide structlog logger used by the functions below.
	logger = structlog.get_logger()
	# Global variables: mutable module state shared by the functions below
	# through `global` declarations.
	# One-time setup gate: generate_response builds the chain while this is 0
	# and increments it afterwards.
	count = 0
	# Page index that render_file uses to pick the page to draw; it is set by
	# generate_response from the 'page' metadata of the first source document.
	n = 0
	# Accumulated (query, answer) pairs passed to the chain as 'chat_history'.
	chat_history = []
	# Placeholder; generate_response rebinds this to the chain returned by
	# process_file on its first call.
	chain = ''


	# Select llm models


	# Select multi-loaders

	# Select embedding models

	# Select vector stores

	# Select retrievers

	# Sample chat chain

	# Sample chat stream chain


	# Sample retriever chain


	# Sample pdf doc conversation chain



	# Function to set the OpenAI API key
	def set_api_key(api_key):
	    """
	    Store the OpenAI API key in the ``OPENAI_API_KEY`` environment variable.

	    Surrounding whitespace is stripped first, because a key pasted into a
	    text box often carries a trailing space or newline that would make
	    every later API call fail authentication.

	    Args:
	        api_key (str): The OpenAI API key entered by the user.

	    Returns:
	        str: Confirmation message stating that the key is set.

	    Raises:
	        gr.Error: If ``api_key`` is ``None``, empty, or only whitespace.
	    """
	    cleaned_key = (api_key or '').strip()
	    if not cleaned_key:
	        # An empty value would still count as "set" for a plain presence
	        # check on the environment variable, so reject it here instead of
	        # reporting success for an unusable key.
	        raise gr.Error('Enter your OpenAI API key')
	    os.environ['OPENAI_API_KEY'] = cleaned_key
	    print('==========API KEY SETUP==========')
	    return 'OpenAI API key is set'

	# Function to enable the API key input box
	def enable_api_box():
	    """
	    Callback placeholder associated with the API key input box.

	    The function takes no arguments and performs no work of its own.

	    Returns:
	        None
	    """
	    return None

	# Function to add text to the chat history
	def add_text(history, text):
	    """
	    Append the user's message to the chat history as a new, unanswered turn.

	    Args:
	        history (list): Chat history; it is extended in place.
	        text (str): The message typed by the user.

	    Returns:
	        list: The same ``history`` object, now ending with ``(text, '')``.

	    Raises:
	        gr.Error: If ``text`` is empty.
	    """
	    if text:
	        # The empty string is the slot for the reply that has not been
	        # generated yet.
	        pending_turn = (text, '')
	        history.append(pending_turn)
	        return history
	    raise gr.Error('Enter text')

	# Function to process the PDF file and create a conversation chain
	def process_file(file):
	    """
	    Build a conversational retrieval chain over an uploaded PDF.

	    The PDF is loaded with PyPDFLoader, split into overlapping chunks,
	    embedded with OpenAI embeddings and indexed in a Chroma vector store.
	    An MMR retriever over that store backs the returned chat chain.

	    Args:
	        file: Uploaded file object; its ``name`` attribute is used as the
	            path of the PDF to load.

	    Returns:
	        tuple: ``(chain, pdf_search)`` where ``chain`` is the
	        ConversationalRetrievalChain and ``pdf_search`` is the Chroma
	        vector store built from the PDF chunks.

	    Raises:
	        gr.Error: If ``OPENAI_API_KEY`` is missing or empty.
	    """
	    # Treat an empty value like a missing one; otherwise the failure only
	    # surfaces later, inside the embedding or chat request.
	    if not os.environ.get('OPENAI_API_KEY'):
	        raise gr.Error('Upload your OpenAI API key')

	    loader = PyPDFLoader(file.name)
	    documents = loader.load()

	    text_splitter = RecursiveCharacterTextSplitter(
	        chunk_size=1500,
	        chunk_overlap=200,
	    )
	    splits = text_splitter.split_documents(documents)

	    embeddings = OpenAIEmbeddings()
	    pdf_search = Chroma.from_documents(splits, embeddings)

	    # MMR search: fetch 4 candidates, keep 2 for the LLM.
	    retriever = pdf_search.as_retriever(
	        search_type='mmr',
	        search_kwargs={'k': 2, 'fetch_k': 4},
	    )
	    chain = ConversationalRetrievalChain.from_llm(
	        ChatOpenAI(temperature=0.3),
	        retriever=retriever,
	        # Source documents are returned so callers can see which chunks
	        # supported the answer.
	        return_source_documents=True,
	    )
	    return chain, pdf_search

	# Function to generate a response based on the chat history and query
	def generate_response(history, query, btn):
	    """
	    Answer the user's query against the uploaded PDF and update the chat.

	    On the first call (while the module-level ``count`` is 0) the chain and
	    vector store are built from ``btn`` via ``process_file`` and kept in
	    module globals; later calls reuse them. The module-level ``n`` is set
	    to the ``page`` metadata of the first source document, when available.

	    Args:
	        history (list): Chat history as (user, bot) pairs; the bot text of
	            the last entry is extended with the generated answer.
	        query (str): The user's query.
	        btn: The uploaded PDF file object, passed to ``process_file``.

	    Returns:
	        tuple: ``(history, " ")`` - the updated chat history and a
	        single-space string (presumably used to reset the input box;
	        confirm against the UI wiring).

	    Raises:
	        gr.Error: If no PDF has been uploaded.
	    """
	    global count, n, chat_history, chain, pdf_search

	    if not btn:
	        raise gr.Error(message='Upload a PDF')
	    if count == 0:
	        chain, pdf_search = process_file(btn)
	        count += 1

	    result = chain({"question": query, 'chat_history': chat_history}, return_only_outputs=True)
	    answer = result["answer"]
	    source_documents = result.get("source_documents", [])

	    logger.info(f'Retrievaled docs to send to llm: {source_documents}')
	    logger.info('====================')
	    chat_history.append((query, answer))
	    logger.info(f'Result from llm: {answer}')
	    logger.info('===================')

	    # Extra lookup of the chunk closest to the answer; used for logging only.
	    docs = pdf_search.as_retriever(
	        search_type='mmr',
	        search_kwargs={'k': 1},
	    ).get_relevant_documents(query=answer)
	    logger.info(f'Result conclude from: {docs}')

	    # Read the page from the document's metadata attribute rather than
	    # from the position of fields when iterating the document, and keep
	    # the previous page when no source document or page is available.
	    if source_documents:
	        page = source_documents[0].metadata.get('page')
	        if page is not None:
	            n = page

	    if history:
	        # Rebuild the last entry instead of mutating it, so a tuple entry
	        # (as appended by add_text) works as well as a list.
	        user_text, bot_text = history[-1][0], history[-1][-1]
	        history[-1] = [user_text, (bot_text or '') + answer]
	    else:
	        history.append([query, answer])
	    return history, " "

	# Function to render a specific page of a PDF file as an image
	def render_file(file):
	    """
	    Render one page of a PDF file as an image.

	    The page index is taken from the module-level ``n``.

	    Args:
	        file: File object whose ``name`` attribute is the path of the PDF.

	    Returns:
	        PIL.Image.Image: The rendered page as an RGB image.
	    """
	    global n
	    # Open through a context manager so the document is closed even when
	    # page lookup or rendering raises; the original never closed it.
	    with fitz.open(file.name) as doc:
	        page = doc[n]
	        # Scale by 300/72 on both axes to rasterise at 300 DPI.
	        pix = page.get_pixmap(matrix=fitz.Matrix(300 / 72, 300 / 72))
	        # Build the image before the document is closed.
	        image = Image.frombytes('RGB', [pix.width, pix.height], pix.samples)
	    return image