Spaces:

SAVAI123
/

AIThing

Sleeping

SAVAI123 committed on Mar 16, 2025

Commit

06dc72e

verified ·

1 Parent(s): 58cf20f

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -60,7 +60,7 @@ def initialize_retriever():
         print(f"Successfully loaded {len(documents)} pages from the PDF")
         # Split text into chunks
-        text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=10)
         text_chunks = text_splitter.split_documents(documents)
         print(f"Split into {len(text_chunks)} text chunks")
@@ -70,7 +70,7 @@ def initialize_retriever():
         # Store embeddings in FAISS index
         vectorstore = FAISS.from_documents(text_chunks, embeddings)
         print("Successfully created vector store")
-        return vectorstore.as_retriever(search_kwargs={"k": 4})
     except Exception as e:
         print(f"Error in initialize_retriever: {str(e)}")

         print(f"Successfully loaded {len(documents)} pages from the PDF")
         # Split text into chunks
+        text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=150)
         text_chunks = text_splitter.split_documents(documents)
         print(f"Split into {len(text_chunks)} text chunks")
         # Store embeddings in FAISS index
         vectorstore = FAISS.from_documents(text_chunks, embeddings)
         print("Successfully created vector store")
+        return vectorstore.as_retriever(search_kwargs={"k": 10})
     except Exception as e:
         print(f"Error in initialize_retriever: {str(e)}")