"""Streamlit app that extracts and displays the text of uploaded PDF files."""

import streamlit as st
from dotenv import load_dotenv
from PyPDF2 import PdfReader


def get_pdf_text(pdf_docs) -> str:
    """Return the concatenated text of every page of every PDF in *pdf_docs*.

    Args:
        pdf_docs: Iterable of objects accepted by ``PdfReader`` (here, the
            files returned by ``st.file_uploader``). ``None`` or an empty
            iterable yields an empty string.

    Returns:
        The text of all pages, in document order then page order, joined
        without any separator.
    """
    page_texts = []
    # ``or ()`` lets a missing upload (None) behave like "no documents".
    for pdf in pdf_docs or ():
        pdf_reader = PdfReader(pdf)
        for page in pdf_reader.pages:
            # ``or ""`` keeps the join safe if a page yields None instead of
            # a string (e.g. a page with no extractable text).
            page_texts.append(page.extract_text() or "")
    return "".join(page_texts)


def main() -> None:
    """Render the page: a question box plus a sidebar for uploading PDFs."""
    load_dotenv()
    st.set_page_config(page_title="Chat with Multiple PDFs", page_icon=":books:")

    st.header("Chat with Multiple PDFs (Made by Badr)")
    # The question is collected but not used yet; the call is kept because it
    # renders the input widget.
    query = st.text_input("Ask a question about your documents:")  # noqa: F841

    with st.sidebar:
        st.subheader("Your Documents")
        pdf_docs = st.file_uploader(
            "Upload your PDFs and click on 'Process'",
            accept_multiple_files=True,
        )
        if st.button("Process"):
            if not pdf_docs:
                # Nothing to extract; tell the user instead of showing
                # an empty result.
                st.warning("Please upload at least one PDF before processing.")
            else:
                with st.spinner("Processing..."):
                    # Get PDF text
                    raw_text = get_pdf_text(pdf_docs)
                    st.write(raw_text)

                    # Further processing steps can be added here
                    # (e.g., text chunking, creating vector store)


if __name__ == '__main__':
    main()