Spaces:

Rehman1603
/

Chat_with_Document

Build error

App Files Files Community

Rehman1603 committed on May 28, 2024

Commit

f8f842e

verified ·

1 Parent(s): 9c996d7

Upload llm_model.py

Browse files

Files changed (1) hide show

llm_model.py +133 -0

llm_model.py ADDED Viewed

	@@ -0,0 +1,133 @@

+from langchain.vectorstores import FAISS
+#from langchain.llms import GooglePalm, CTransformers
+from langchain.document_loaders import PyPDFLoader, TextLoader, Docx2txtLoader
+from langchain.embeddings import HuggingFaceEmbeddings, HuggingFaceInstructEmbeddings
+from langchain.prompts import PromptTemplate
+from langchain.chains import RetrievalQA
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from huggingface_hub import InferenceClient
+from langdetect import detect  # Language detection
+import os
+from dotenv import load_dotenv
+vector_index_path = "assets/vectordb/faiss_index"  # FAISS index directory; NOTE(review): not read by any active code in this file
+class LlmModel:
+    """Retrieval-augmented chat helper built on a hosted Mistral instruct model.
+
+    The class turns an uploaded document into a FAISS retriever, formats an
+    instruct-style prompt from the chat history plus the retrieved chunks,
+    and streams the answer through the Hugging Face Inference API.
+    """
+
+    # Hosted model queried through the Hugging Face Inference API.
+    MODEL_ID = "mistralai/Mistral-7B-Instruct-v0.1"
+
+    def __init__(self):
+        """Load environment variables, then the embedding model."""
+        # Take environment variables (e.g. HF_TOKEN) from .env first.
+        self.load_env_variables()
+        # Embedding model used to index and query document chunks.
+        self.hf_embeddings = self.load_huggingface_embeddings()
+
+    def load_env_variables(self):
+        """Take environment variables from ``.env`` via ``load_dotenv``."""
+        load_dotenv()
+
+    def detect_language(self, text):
+        """Return the language code detected for ``text``.
+
+        Detection is best effort: any failure falls back to ``"en"``.
+        """
+        try:
+            return detect(text)
+        except Exception:
+            # Unlike a bare ``except:``, this lets KeyboardInterrupt and
+            # SystemExit propagate while still defaulting to English.
+            return "en"
+
+    def generate_response(self, question, context):
+        """Assemble a question/context payload for the hosted model.
+
+        NOTE(review): this method looks unfinished. The payload is built but
+        never sent, and nothing is returned, so callers always receive
+        ``None``. That behaviour is kept as-is; the working inference path is
+        ``mixtral_chat_inference``.
+        """
+        language = self.detect_language(question)  # not used yet
+        model_id = self.MODEL_ID  # not used yet
+        inputs = {
+            "inputs": {
+                "question": question,
+                "context": context,
+            }
+        }
+
+    @staticmethod
+    def _context_to_text(context):
+        """Render retrieved context as plain text for the prompt.
+
+        A list/tuple is joined with blank lines, using each item's
+        ``page_content`` attribute when it has one, so the prompt carries the
+        chunk text rather than the ``repr`` of the document objects. Any
+        other value is formatted exactly as an f-string would format it.
+        """
+        if isinstance(context, (list, tuple)):
+            return "\n\n".join(
+                str(getattr(item, "page_content", item)) for item in context
+            )
+        return f"{context}"
+
+    def custom_prompt(self, question, history, context):
+        """Build the RAG prompt in the ``[INST] ... [/INST]`` chat format.
+
+        Args:
+            question: The user's current question.
+            history: Iterable of ``(user_prompt, bot_response)`` pairs that
+                are replayed before the new question.
+            context: Retrieved context, either a string or a list/tuple of
+                document-like objects exposing ``page_content``.
+
+        Returns:
+            The full prompt string.
+        """
+        context = self._context_to_text(context)
+        prompt = "<s>"
+        for user_prompt, bot_response in history:  # provide chat history
+            prompt += f"[INST] {user_prompt} [/INST]"
+            prompt += f" {bot_response}</s>"
+        message_prompt = f"""
+        You are a question answer agent and you must strictly follow below prompt template.
+        Given the following context and a question, generate an answer based on this context only.
+        Keep answers brief and well-structured. Do not give one word answers.
+        If the answer is not found in the context, kindly state "I don't know." Don't try to make up an answer.
+        CONTEXT: {context}
+        QUESTION: {question}
+        """
+        prompt += f"[INST] {message_prompt} [/INST]"
+        return prompt
+
+    def format_sources(self, sources):
+        """Format retrieved documents as human-readable source strings.
+
+        Args:
+            sources: Iterable of document-like objects with ``page_content``
+                and a ``metadata`` mapping.
+
+        Returns:
+            A list with one string per document: its content, its source
+            and, when the metadata has a ``page`` entry, its page number.
+        """
+        source_results = []
+        for source in sources:
+            metadata = source.metadata
+            entry = (str(source.page_content) +
+                     "\n Document: " + str(metadata.get('source', 'unknown')))
+            # Documents without a 'page' entry used to raise KeyError here;
+            # the page suffix is now simply omitted for them.
+            if 'page' in metadata:
+                entry += " Page: " + str(metadata['page'])
+            source_results.append(entry)
+        return source_results
+
+    def mixtral_chat_inference(self, prompt, history, temperature, top_p, repetition_penalty, retriever):
+        """Answer ``prompt`` from retrieved context via the Inference API.
+
+        Despite the method name, the model queried is ``MODEL_ID``
+        (Mistral-7B-Instruct).
+
+        Args:
+            prompt: The user's question; also used as the retrieval query.
+            history: Iterable of ``(user_prompt, bot_response)`` pairs.
+            temperature: Sampling temperature, clamped to at least 0.01.
+            top_p: Nucleus-sampling parameter passed through unchanged.
+            repetition_penalty: Passed through unchanged.
+            retriever: Object exposing ``get_relevant_documents(query)``.
+
+        Returns:
+            A tuple ``(stream, sources)``: the result of the streaming
+            ``text_generation`` call and the formatted source strings.
+
+        Raises:
+            KeyError: If the ``HF_TOKEN`` environment variable is not set.
+        """
+        context = retriever.get_relevant_documents(prompt)
+        sources = self.format_sources(context)
+        # Use the Hugging Face Inference API.
+        client = InferenceClient(self.MODEL_ID,
+                                 token=os.environ["HF_TOKEN"])
+        # Keep the temperature strictly positive: clamp it to 0.01.
+        temperature = max(float(temperature), 1e-2)
+        generate_kwargs = dict(
+            temperature=temperature,
+            max_new_tokens=512,
+            top_p=top_p,
+            repetition_penalty=repetition_penalty,
+            do_sample=True,
+        )
+        formatted_prompt = self.custom_prompt(prompt, history, context)
+        return client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False), sources
+
+    def load_huggingface_embeddings(self):
+        """Return the MiniLM sentence-embedding model configured for CPU."""
+        return HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2",
+                                     model_kwargs={'device': 'cpu'})
+
+    def create_vector_db(self, filename):
+        """Index a document in FAISS and return a similarity retriever.
+
+        Args:
+            filename: Path to a ``.pdf``, ``.doc``/``.docx`` or ``.txt``
+                file. The extension is matched case-insensitively.
+
+        Returns:
+            A retriever over the in-memory FAISS index.
+
+        Raises:
+            ValueError: If the extension is unsupported, or the document
+                yields no text chunks to index.
+        """
+        extension = os.path.splitext(filename)[1].lower()
+        if extension == ".pdf":
+            loader = PyPDFLoader(file_path=filename)
+        elif extension in (".doc", ".docx"):
+            # NOTE(review): Docx2txtLoader presumably only parses .docx;
+            # confirm that legacy .doc files actually load.
+            loader = Docx2txtLoader(filename)
+        elif extension == ".txt":
+            loader = TextLoader(filename)
+        else:
+            # Previously `loader` stayed unbound here and the method died
+            # with an UnboundLocalError at `loader.load()`.
+            raise ValueError(
+                f"Unsupported file type {extension!r}. "
+                "Supported types: .pdf, .doc, .docx, .txt"
+            )
+        # Split documents into overlapping chunks for embedding.
+        text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=50)
+        splits = text_splitter.split_documents(loader.load())
+        if not splits:
+            raise ValueError('No content to index. The document may be empty or not properly formatted.')
+        vectordb = FAISS.from_documents(documents=splits,
+                                        embedding=self.hf_embeddings)
+        # Persistence is disabled: the index lives in memory only. To enable
+        # it, save with vectordb.save_local(vector_index_path) and reload with
+        # FAISS.load_local(vector_index_path, self.hf_embeddings).
+        return vectordb.as_retriever(search_type="similarity")