Spaces:

techconspartners
/

ConversAI

Sleeping

Rauhan committed on Aug 21, 2024

Commit

d22b8e9

1 Parent(s): 39cf044

DEBUG: FlashRank

Files changed (1) hide show

functions.py CHANGED Viewed

@@ -198,15 +198,11 @@ def answerQuery(query: str, vectorstore: str, llmModel: str = "llama3-70b-8192")
         vectorstore=vectorstore,
         docstore=store,
         child_splitter=RecursiveCharacterTextSplitter(),
-        search_kwargs={"k": 20}
-    )
-    compressor = FlashrankRerank()
-    retriever = ContextualCompressionRetriever(
-        base_compressor=compressor, base_retriever=retriever
     )
     baseChain = (
             {"context": RunnableLambda(lambda x: x["question"]) | retriever | RunnableLambda(format_docs),
-             "question": RunnablePassthrough(), "chatHistory": RunnablePassthrough()}
             | prompt
             | ChatGroq(model=llmModel, temperature=0.75, max_tokens=512)
             | StrOutputParser()
@@ -289,7 +285,7 @@ def getLinks(url: str, timeout=30):
 def getTextFromImagePDF(pdfBytes):
     def getText(image):
         global reader
-        return "\n".join([text[1] for text in reader.readtext(np.array(image), paragraph=True)])
     allImages = convert_from_bytes(pdfBytes)
     texts = [getText(image) for image in allImages]
     return "\n\n\n".join(texts)

         vectorstore=vectorstore,
         docstore=store,
         child_splitter=RecursiveCharacterTextSplitter(),
+        search_kwargs={"k": 4, "score_threshold": 0}
     )
     baseChain = (
             {"context": RunnableLambda(lambda x: x["question"]) | retriever | RunnableLambda(format_docs),
+             "question": RunnableLambda(lambda x: x["question"]), "chatHistory": RunnableLambda(lambda x: x["chatHistory"])}
             | prompt
             | ChatGroq(model=llmModel, temperature=0.75, max_tokens=512)
             | StrOutputParser()
 def getTextFromImagePDF(pdfBytes):
     def getText(image):
         global reader
+        return "\n".join([text[1] for text in reader.readtext(np.array(image), paragraph=True, x_ths = 0)])
     allImages = convert_from_bytes(pdfBytes)
     texts = [getText(image) for image in allImages]
     return "\n\n\n".join(texts)