Create app.py
app.py (new file):
import os
import tempfile
import time

import streamlit as st
from dotenv import load_dotenv

from langchain_core.messages import AIMessage, HumanMessage
from langchain_core.prompts import ChatPromptTemplate, MessagesPlaceholder, PromptTemplate

from langchain_ollama import ChatOllama
from langchain_openai import ChatOpenAI
from langchain_huggingface import HuggingFaceEmbeddings, HuggingFaceEndpoint

from langchain_community.document_loaders import PyPDFLoader
from langchain_community.vectorstores import FAISS
from langchain_text_splitters import RecursiveCharacterTextSplitter
from langchain.chains import create_history_aware_retriever, create_retrieval_chain
from langchain.chains.combine_documents import create_stuff_documents_chain

# Read API keys from a local .env file
load_dotenv()
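
# A sketch of the .env file this expects (these are the standard variables the
# integrations read; which one you need depends on model_class below):
#
#   HUGGINGFACEHUB_API_TOKEN=hf_...   # used by HuggingFaceEndpoint
#   OPENAI_API_KEY=sk-...             # used by ChatOpenAI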

# Streamlit settings
st.set_page_config(page_title="Chat with documents 📄", page_icon="📄")
st.title("Chat with documents 📄")
st.subheader("Ask questions and get answers from your documents 💬")

# LLM provider: one of "hf_hub", "openai", "ollama"
model_class = "hf_hub"

## Model Providers
def model_hf_hub(model="meta-llama/Meta-Llama-3-8B-Instruct", temperature=0.1):
    """Hosted inference via the Hugging Face Hub."""
    llm = HuggingFaceEndpoint(
        repo_id=model,
        temperature=temperature,
        max_new_tokens=512,
        return_full_text=False,
    )
    return llm

def model_openai(model="gpt-4o-mini", temperature=0.1):
    """OpenAI chat model via API."""
    llm = ChatOpenAI(
        model=model,
        temperature=temperature,
    )
    return llm

def model_ollama(model="phi3", temperature=0.1):
    """Local model served by an Ollama instance."""
    llm = ChatOllama(
        model=model,
        temperature=temperature,
    )
    return llm
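
# Illustrative sketch only (hypothetical helper, never called by the app):
# all three providers return objects with the same .invoke() interface, so
# they are interchangeable in the chains below.
def _demo_provider():
    llm = model_ollama()  # assumes a local Ollama server with phi3 pulled
    print(llm.invoke("Reply with one short sentence."))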

## Indexing and Retrieval

def config_retriever(uploads):
    # Load: write each uploaded PDF to a temp dir so PyPDFLoader can read it
    docs = []
    temp_dir = tempfile.TemporaryDirectory()
    for file in uploads:
        temp_filepath = os.path.join(temp_dir.name, file.name)
        with open(temp_filepath, "wb") as f:
            f.write(file.getvalue())
        loader = PyPDFLoader(temp_filepath)
        docs.extend(loader.load())

    # Split into overlapping chunks so answers can span page boundaries
    text_splitter = RecursiveCharacterTextSplitter(
        chunk_size=1000,
        chunk_overlap=200
    )
    splits = text_splitter.split_documents(docs)

    # Embed and store in a FAISS index, persisted to disk as well
    embeddings = HuggingFaceEmbeddings(model_name="BAAI/bge-m3")
    vectorstore = FAISS.from_documents(splits, embeddings)
    vectorstore.save_local('vectorstore/db_faiss')

    # Retrieve with MMR: fetch 4 candidates, keep the 3 most diverse
    retriever = vectorstore.as_retriever(
        search_type='mmr',
        search_kwargs={'k': 3, 'fetch_k': 4}
    )

    return retriever
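
# Sketch (hypothetical helper, not called by the app): reload the index
# persisted above on a later run instead of re-embedding the PDFs. The
# embedding model must match the one used at build time, and
# allow_dangerous_deserialization opts in to unpickling a file you created
# yourself.
def _load_saved_retriever():
    embeddings = HuggingFaceEmbeddings(model_name="BAAI/bge-m3")
    vectorstore = FAISS.load_local(
        'vectorstore/db_faiss',
        embeddings,
        allow_dangerous_deserialization=True,
    )
    return vectorstore.as_retriever(search_type='mmr', search_kwargs={'k': 3, 'fetch_k': 4})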

def config_rag_chain(model_class, retriever):
    # Load the chosen LLM
    if model_class == "hf_hub":
        llm = model_hf_hub()
    elif model_class == "openai":
        llm = model_openai()
    elif model_class == "ollama":
        llm = model_ollama()
    else:
        raise ValueError(f"Unknown model_class: {model_class}")

    # Llama 3 served through the raw HF endpoint needs explicit chat-template
    # tokens; chat models (OpenAI, Ollama) apply their own templates.
    if model_class.startswith("hf"):
        token_s = "<|begin_of_text|><|start_header_id|>system<|end_header_id|>"
        token_e = "<|eot_id|><|start_header_id|>assistant<|end_header_id|>"
    else:
        token_s, token_e = "", ""

    # Contextualization prompt: rewrite the follow-up into a standalone question
    context_q_system_prompt = (
        "Given the following chat history and the follow-up question which might "
        "reference context in the chat history, formulate a standalone question "
        "which can be understood without the chat history. Do NOT answer the "
        "question, just reformulate it if needed and otherwise return it as is."
    )
    context_q_system_prompt = token_s + context_q_system_prompt
    context_q_user_prompt = "Question: {input}" + token_e
    context_q_prompt = ChatPromptTemplate.from_messages(
        [
            ("system", context_q_system_prompt),
            MessagesPlaceholder("chat_history"),
            ("human", context_q_user_prompt),
        ]
    )

    # Chain for contextualization: condense the question, then retrieve
    history_aware_retriever = create_history_aware_retriever(
        llm=llm, retriever=retriever, prompt=context_q_prompt
    )

    # Q&A prompt
    qa_prompt_template = """You are a helpful virtual assistant answering general questions.
Use the following pieces of retrieved context to answer the question.
If you don't know the answer, just say you don't know. Keep your answer concise.
Answer in English.

Question: {input}
Context: {context}"""

    qa_prompt = PromptTemplate.from_template(token_s + qa_prompt_template + token_e)

    # Stuff the retrieved documents into the Q&A prompt and answer
    qa_chain = create_stuff_documents_chain(llm, qa_prompt)

    rag_chain = create_retrieval_chain(
        history_aware_retriever,
        qa_chain,
    )

    return rag_chain
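
# Sketch of the chain's contract (hypothetical helper, never called): invoke()
# takes the new input plus the running history and returns a dict whose
# "answer" is the generated text and "context" the retrieved Documents, which
# is exactly what the UI below unpacks.
def _demo_rag_round(retriever):
    chain = config_rag_chain(model_class, retriever)
    result = chain.invoke({"input": "What is this document about?", "chat_history": []})
    return result["answer"], result["context"]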

## Side panel: upload PDFs
uploads = st.sidebar.file_uploader(
    label="Upload files", type=["pdf"],
    accept_multiple_files=True
)
if not uploads:
    st.info("Please upload a file to continue!")
    st.stop()

# Session state survives Streamlit's top-to-bottom reruns, so the chat
# history and the retriever are kept across user messages.
if "chat_history" not in st.session_state:
    st.session_state.chat_history = [
        AIMessage(content="Hi, I'm your virtual assistant! How can I help you?"),
    ]

if "docs_list" not in st.session_state:
    st.session_state.docs_list = None

if "retriever" not in st.session_state:
    st.session_state.retriever = None

# Replay the conversation so far
for message in st.session_state.chat_history:
    if isinstance(message, AIMessage):
        with st.chat_message("AI"):
            st.write(message.content)
    elif isinstance(message, HumanMessage):
        with st.chat_message("Human"):
            st.write(message.content)

# Measure how long a response takes to generate
start = time.time()
user_query = st.chat_input("Enter your message here...")

if user_query is not None and user_query != "" and uploads is not None:
    st.session_state.chat_history.append(HumanMessage(content=user_query))

    with st.chat_message("Human"):
        st.markdown(user_query)

    with st.chat_message("AI"):
        # Rebuild the index only when the set of uploaded files changes
        if st.session_state.docs_list != uploads:
            st.session_state.docs_list = uploads
            st.session_state.retriever = config_retriever(uploads)

        rag_chain = config_rag_chain(model_class, st.session_state.retriever)

        result = rag_chain.invoke({
            "input": user_query,
            "chat_history": st.session_state.chat_history,
        })

        resp = result['answer']
        st.write(resp)

        # Show the sources the answer was grounded in
        sources = result['context']
        for idx, doc in enumerate(sources):
            source = doc.metadata['source']
            file = os.path.basename(source)
            page = doc.metadata.get('page', 'Page not specified')

            ref = f":link: Source {idx}: *{file} - p. {page}*"
            with st.popover(ref):
                st.caption(doc.page_content)

    st.session_state.chat_history.append(AIMessage(content=resp))

    end = time.time()
    print("Time: ", end - start)
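
# Deployment note (assumption, not part of this commit): a Hugging Face Space
# installs dependencies from a requirements.txt beside this file, and a build
# error usually means one of them is missing. A minimal, unpinned set inferred
# from the imports above:
#
#   streamlit
#   python-dotenv
#   langchain
#   langchain-community
#   langchain-huggingface
#   langchain-openai
#   langchain-ollama
#   langchain-text-splitters
#   sentence-transformers
#   faiss-cpu
#   pypdf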