insurance-chatbot / utils.py
skanda12's picture
Update utils.py
f4d9a6d verified
raw
history blame contribute delete
238 Bytes
import fitz # PyMuPDF
def extract_text_from_pdf(file):
    """Return the plain text of every page in a PDF, joined by newlines.

    The argument is consumed through ``file.read()`` and the resulting data
    is handed to PyMuPDF as an in-memory stream declared as a PDF. Pages are
    visited in document order and their text is separated by a single
    ``"\\n"``.
    """
    pdf_data = file.read()
    # The context manager closes the document once all pages have been read.
    with fitz.open(stream=pdf_data, filetype="pdf") as document:
        page_texts = [page.get_text() for page in document]
        return "\n".join(page_texts)