Spaces:

Hk4crprasad
/

Test

Sleeping

App Files Files Community

Hk4crprasad committed on Jan 23, 2024

Commit

4124846

verified ·

1 Parent(s): 3334b36

Upload 3 files

Browse files

Files changed (2) hide show

app.py +93 -2
requirements.txt +7 -1

app.py CHANGED Viewed

@@ -11,8 +11,77 @@ from google.generativeai.types.generation_types import (
     BlockedPromptException,
     BrokenResponseError
 )
 load_dotenv()
 import datetime
 url = "https://y39t47-8080.csb.app/search"
 weathe_key = os.getenv("WEATHER_KEY")
@@ -675,6 +744,10 @@ with cols[2]:
 with cols[3]:
     graphviz_mode = st.toggle("Graphviz mode", value=False, help="Activate this mode to generate a graph with graphviz in .dot from your message")
 if image_atachment:
     image = st.file_uploader("Upload your image", type=['png', 'jpg', 'jpeg'])
     url = st.text_input("Or paste your image url")
@@ -685,7 +758,7 @@ else:
 if txt_atachment:
-    txtattachment = st.file_uploader("Upload your text file", type=['txt'])
 else:
     txtattachment = None
@@ -694,7 +767,25 @@ if csv_excel_atachment:
 else:
     csvexcelattachment = None
-prompt = st.chat_input("Write your message")
 if prompt:
     txt = ''

     BlockedPromptException,
     BrokenResponseError
 )
+from PyPDF2 import PdfReader
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+import os
+from langchain_google_genai import GoogleGenerativeAIEmbeddings
+import google.generativeai as genai
+from langchain.vectorstores import FAISS
+from langchain_google_genai import ChatGoogleGenerativeAI
+from langchain.chains.question_answering import load_qa_chain
+from langchain.prompts import PromptTemplate
 load_dotenv()
 import datetime
+def get_pdf_text(pdf_docs):
+    text=""
+    for pdf in pdf_docs:
+        pdf_reader= PdfReader(pdf)
+        for page in pdf_reader.pages:
+            text+= page.extract_text()
+    return  text
+def get_text_chunks(text):
+    text_splitter = RecursiveCharacterTextSplitter(chunk_size=10000, chunk_overlap=1000)
+    chunks = text_splitter.split_text(text)
+    return chunks
+def get_vector_store(text_chunks):
+    embeddings = GoogleGenerativeAIEmbeddings(model = "models/embedding-001")
+    vector_store = FAISS.from_texts(text_chunks, embedding=embeddings)
+    vector_store.save_local("faiss_index")
+def get_conversational_chain():
+    prompt_template = """
+    Try always to answer only available in the context and please always give perfect answer from the available context , if i say Summerize then Summerize , and if ask key points then give the key points, if i ask who are you then answer 'i am BHAI(Best High-Quality Artificial Intelligence) Made by hk4crprasad' and always give the perfect and correct output, if i say that tell me more about something in the context then tell accordingly.,
+    Context:\n {context}?\n
+    Question: \n{question}\n
+    Answer:
+    """
+    model = ChatGoogleGenerativeAI(model="gemini-pro",
+                             temperature=0.5)
+    prompt = PromptTemplate(template = prompt_template, input_variables = ["context", "question"])
+    chain = load_qa_chain(model, chain_type="stuff", prompt=prompt)
+    return chain
+def user_input(user_question):
+    embeddings = GoogleGenerativeAIEmbeddings(model = "models/embedding-001")
+    new_db = FAISS.load_local("faiss_index", embeddings)
+    docs = new_db.similarity_search(user_question)
+    chain = get_conversational_chain()
+    pdfans = chain(
+        {"input_documents":docs, "question": user_question}
+        , return_only_outputs=True)
+    return pdfans["output_text"]
 url = "https://y39t47-8080.csb.app/search"
 weathe_key = os.getenv("WEATHER_KEY")
 with cols[3]:
     graphviz_mode = st.toggle("Graphviz mode", value=False, help="Activate this mode to generate a graph with graphviz in .dot from your message")
+with cols[4]:
+    pdf_mode = st.toggle("Pdf ask mode", value=False, help="Activate this mode to generate a graph with graphviz in .dot from your message")
 if image_atachment:
     image = st.file_uploader("Upload your image", type=['png', 'jpg', 'jpeg'])
     url = st.text_input("Or paste your image url")
 if txt_atachment:
+    txtattachment = st.file_uploader("Upload your text file", type=['txt, py, go, java, php, etc'])
 else:
     txtattachment = None
 else:
     csvexcelattachment = None
+if pdf_mode:
+    pdf_docs = st.file_uploader("Upload your PDF Files and Click on the Submit & Process Button", type=['pdf'])
+    if st.button("Submit & Process"):
+        with st.spinner("Processing..."):
+            raw_text = get_pdf_text(pdf_docs)
+            text_chunks = get_text_chunks(raw_text)
+            get_vector_store(text_chunks)
+            st.success("Done")
+else:
+    pdf_docs = None
+if pdf_docs:
+    prompt = st.chat_input("Write your questions according to the pdf")
+    if prompt:
+        prmt  = {'role': 'user', 'parts':[prompt]}
+        usertxt = user_input(prompt)
+        append_message({'role': 'model', 'parts':usertxt})
+else:
+    prompt = st.chat_input("Write your message")
 if prompt:
     txt = ''

requirements.txt CHANGED Viewed

@@ -1,4 +1,10 @@
 google-generativeai
 pandas
 numpy
-python-dotenv==1.0.0

 google-generativeai
 pandas
 numpy
+python-dotenv==1.0.0
+langchain
+PyPDF2
+chromadb
+faiss-cpu
+langchain_google_genai
+langchain-community